#!/bin/bash
#
# Rebuild the Debian "stable" import from scratch, working in the directory
# that contains this script:
#   1. wipe the previous run (distfiles, output, logs, *.h5, mirrored metadata)
#   2. download the Sources, Packages and Translation-en indexes and feed them
#      to load_sources.py / load_packages.py / load_descriptions.py
#   3. download stable_copyright and stable_changelog for every source package
#      from metadata.ftp-master.debian.org
#   4. run the copyright/changelog loaders and both exporters
#   5. record empty and license-less output files in ./broken and delete them
#
# Requires: wget, gunzip, bunzip2, pv, python, and the sourced "err" helper.
# NOTE(review): "err" is not visible here; presumably it installs error
# handling (errexit / ERR trap) -- confirm. The code below is written so it
# behaves sensibly with or without errexit and pipefail.

source err
set -x

x="$(readlink -f -- "${BASH_SOURCE[0]}")"
cd -- "${x%/*}" # directory of this file

readonly mirror=http://ftp.debian.org/debian/dists/stable
readonly metadata_host=metadata.ftp-master.debian.org

# NOTE(review): the original threshold expression was lost from the source
# text; 10 comes from the surviving comment ("number of files - 10").
# Overridable from the environment because the bug report quoted further
# down mentions 30 missing files.
readonly max_missing=${MAX_MISSING:-10}

#######################################
# Download a compressed index and append its decompressed content to a file.
# Arguments: $1 - URL to fetch
#            $2 - file to append to
#            $3... - decompressor command reading stdin, writing stdout
#######################################
fetch_index() {
  local url=$1 dest=$2
  shift 2
  wget -O - "$url" | "$@" >> "$dest"
}

rm -rf -- distfiles output *.log *.h5 "$metadata_host"
mkdir distfiles

# --- source packages ---------------------------------------------------------
fetch_index "$mirror/main/source/Sources.gz" distfiles/Sources gunzip
# Disabled suites, kept for reference:
#fetch_index http://ftp.debian.org/debian/dists/stable-updates/main/source/Sources.gz distfiles/Sources gunzip
#fetch_index http://security.debian.org/debian-security/dists/stable/updates/main/source/Sources.gz distfiles/Sources gunzip

# One array element per unique source package name.
mapfile -t packages < <(
  grep ^Package: distfiles/Sources | sort -u | sed 's/Package: //'
)
pv distfiles/Sources | python load_sources.py

# --- binary packages ---------------------------------------------------------
fetch_index "$mirror/main/binary-all/Packages.gz" distfiles/Packages gunzip
fetch_index "$mirror/main/binary-amd64/Packages.gz" distfiles/Packages gunzip
#fetch_index http://ftp.debian.org/debian/dists/stable-updates/main/binary-amd64/Packages.gz distfiles/Packages gunzip
#fetch_index http://security.debian.org/debian-security/dists/stable/updates/main/binary-all/Packages.gz distfiles/Packages gunzip
pv distfiles/Packages | python load_packages.py

# --- package descriptions ----------------------------------------------------
fetch_index "$mirror/main/i18n/Translation-en.bz2" distfiles/Translation-en bunzip2
#fetch_index http://ftp.debian.org/debian/dists/stable-updates/main/i18n/Translation-en.bz2 distfiles/Translation-en bunzip2
#fetch_index http://security.debian.org/debian-security/dists/stable/updates/main/i18n/Translation-en.bz2 distfiles/Translation-en bunzip2
pv distfiles/Translation-en | python load_descriptions.py

# --- copyright / changelog URL list ------------------------------------------
rm -f -- downloadlist*
for package in "${packages[@]}"; do
  # Files are sharded by the first letter of the package name, except that
  # "lib*" packages use their first four characters (e.g. "libf").
  if [[ $package == lib* ]]; then
    letter=${package:0:4}
  else
    letter=${package:0:1}
  fi
  printf '%s\n' \
    "http://$metadata_host/changelogs/main/$letter/$package/stable_copyright" \
    "http://$metadata_host/changelogs/main/$letter/$package/stable_changelog"
done >> downloadlist

# wget may return 8 here because Debian removed a package between the time
# downloadlist was built and the time its URL was fetched, so retry a few
# times and afterwards judge success by the number of files actually present.
for (( i = 0; i < 10; i++ )); do
  if wget -nc -nv -x --continue -i downloadlist; then
    break
  fi
done

# Emailed 490848@bugs.debian.org 2018-07-06 with subject:
# "30 missing stable_copyright and stable_changelog files"
# -- see https://bugs.debian.org/cgi-bin/bugreport.cgi?bug=490848#51
#
# NOTE(review): everything from here to the "wget ... downloadlist404" call
# is a RECONSTRUCTION. The original text between "$(wc -l" and
# ">> downloadlist404; done" was lost. The surviving fragments only show
# that (a) the count of downloaded files was compared with an expression
# based on the line count of something, and (b) a loop appended to
# downloadlist404. Confirm both the failure action and the loop body against
# the upstream script before relying on them.
downloaded=$(find "$metadata_host" -type f | wc -l)
expected=$(wc -l < downloadlist)
if (( downloaded < expected - max_missing )); then
  printf 'error: only %d of %d metadata files were downloaded\n' \
    "$downloaded" "$expected" >&2
  exit 1
fi

# Collect every URL whose local copy is still missing (wget -x stores each
# file under host/path, i.e. the URL minus its scheme).
while IFS= read -r url; do
  [[ -e ${url#http://} ]] || printf '%s\n' "$url" >> downloadlist404
done < downloadlist

# Allow this to fail: it is only an effort to work around the bug above,
# and it is not perfect.
wget -v -x --continue -i downloadlist404 || :

# --- import and export -------------------------------------------------------
python load_copyright.py &> cp_import.log
python load_changelog.py &> cl_import.log
python export.py
python export_json.py

# --- report and prune broken output ------------------------------------------
echo "empty files:" > broken
# Single pass: list each empty file, then delete it.
find output -type f -empty -print -delete >> broken

echo "no license:" >> broken
# grep -L prints the files that contain no "Project license" line. Reading
# the list once into an array avoids running grep twice, avoids "rm: missing
# operand" when every file has a license, and does not misparse names
# containing ":0".
mapfile -t unlicensed < <(grep -L -- "Project license" output/*)
if (( ${#unlicensed[@]} > 0 )); then
  printf '%s\n' "${unlicensed[@]}" >> broken
  printf '%s\0' "${unlicensed[@]}" | xargs -0 rm --
fi