From 2a2a0d49ecccabe971bb0a39e6206bb47cd17168 Mon Sep 17 00:00:00 2001 From: Ruben Rodriguez Date: Fri, 26 Jun 2015 09:50:14 -0500 Subject: Sanitize Upstream-Name header in load_copyright Some dep5 files are malformed and include the author's name and email in the Upstream-Name field --- load_copyright.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/load_copyright.py b/load_copyright.py index a5b1f5d..1ab361d 100644 --- a/load_copyright.py +++ b/load_copyright.py @@ -83,6 +83,8 @@ def import_one(pkgname, fh): header['Upstream-Name'] = \ header['Upstream-Name'].replace(u'\xa0', ' ') #copy_summary['Upstream-Name'].replace('\xc2\xa0', ' ') + if '@' in header['Upstream-Name']: + header['Upstream-Name'] = pkgname copy_summary = pd.DataFrame([header]) #print copy_summary.T.to_string() -- cgit v1.2.3