#!/usr/bin/env python # -*- coding: utf-8 -*- # Copyright (C) 2023 Free Software Foundation # This program is free software: you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation, either version 3 of the License, or # (at your option) any later version. # This program is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # You should have received a copy of the GNU General Public License # along with this program. If not, see . from debian import changelog import pandas as pd import os import sys from dateutil import parser import subprocess def import_one(pkgname, fh): try: c = changelog.Changelog(fh) date = parser.parse(c.date).strftime('%Y-%m-%d') df = pd.DataFrame([{'_srcpkg':c.package, 'version':c.version, 'date':date, 'author':c.author}]) except: return return (df) def get_pkgname(path): (dir, base) = os.path.split(path) if base in ('current', 'stable_changelog'): return get_pkgname(dir) else: return base def main(): versions = [] for path in subprocess.check_output("find metadata.ftp-master.debian.org -name stable_changelog".split()).strip().split(): pkgname = get_pkgname(path) print pkgname, path data = import_one(pkgname, file(path)) if data is not None: versions.append(data) versions = pd.concat(versions) print versions store = pd.HDFStore('cl.h5') store['cl_versions'] = versions store.close() if __name__ == '__main__': main()