diff options
Diffstat (limited to 'load_descriptions.py')
-rw-r--r-- | load_descriptions.py | 12 |
1 files changed, 12 insertions, 0 deletions
"""Load Debian control paragraphs from stdin into an HDF5 store.

Every paragraph read from standard input is parsed with
``debian.deb822.Packages`` and turned into one row of a pandas DataFrame
(the paragraph's field names become the columns).  The resulting frame is
written to the file ``pkg.h5`` under the key ``descriptions``.

NOTE(review): judging by the file name, the input is presumably a package
description index -- confirm against how the script is invoked.
"""

import sys

import debian.deb822
import pandas as pd

# iter_paragraphs yields paragraphs lazily; each one is converted to a plain
# dict so that pandas can derive the columns from the field names.
paragraphs = debian.deb822.Packages.iter_paragraphs(sys.stdin)
df = pd.DataFrame([dict(paragraph) for paragraph in paragraphs])

# Use the store as a context manager so the HDF5 file handle is released
# even when writing the frame raises.
with pd.HDFStore('pkg.h5') as store:
    store['descriptions'] = df