about summary refs log tree commit diff
diff options
context:
space:
mode:
author Dafydd Harries <daf@rhydd.org> 2013-03-19 09:28:30 -0400
committer Dafydd Harries <daf@rhydd.org> 2013-03-19 09:28:30 -0400
commit f5687f4cbff7a06b31f0b24b2269fc09235612b8 (patch)
tree 14961ca8eb43beca590b11d566d9841d87ec8870
parent a280d5c69f047f66b88727341c72bcb86463962b (diff)
flag problematic text in descriptions
-rw-r--r-- export.py 11
1 files changed, 10 insertions, 1 deletions
diff --git a/export.py b/export.py
index 0e69803..c3d9625 100644
--- a/export.py
+++ b/export.py
@@ -76,10 +76,19 @@ def extract_languages(tags):
return list(set(langs))
+def catechise(s):
+    """Return s with each flagged term wrapped in ??...??, ignoring case."""
+    heresies = ["open source", "debian", "(?<!gnu/)linux", "creative commons"]
+    pattern = '\\b(%s)\\b' % '|'.join([h.replace(' ', '.') for h in heresies])
+    # flags= must be a keyword: the 4th positional argument of re.sub is count.
+    return re.sub(pattern, lambda m: '??%s??' % m.group(1).replace('\n', ' '),
+                  s, flags=re.DOTALL | re.IGNORECASE)
+
def munge_description(s):
paras = s.split('\n .\n')
return '\n\n'.join(
- textwrap.fill(para.lstrip().replace('\n', ''), 65) for para in paras)
+ catechise(textwrap.fill(para.lstrip().replace('\n', ''), 65))  # wrap to 65 columns first, then flag terms
+ for para in paras)
def get_license_map():
map = {}