[textsum] Use lib/labeler to unify labels when converting data

Persper · Aug 9, 2017 · f287e37 · f287e37
1 parent 7f2491b
commit f287e37
Showing 1 changed file with 5 additions and 16 deletions.
diff --git a/seq2seq/textsum/convert_data.py b/seq2seq/textsum/convert_data.py
@@ -8,6 +8,10 @@
 import pickle
 import re
 
+import sys
+sys.path.append('../../lib')
+import labeler
+
 # Special tokens
 PARAGRAPH_START = '<p>'
 PARAGRAPH_END = '</p>'
@@ -18,21 +22,6 @@
 DOCUMENT_START = '<d>'
 DOCUMENT_END = '</d>'
 
-# Labels
-BUG = 'bug'
-FEATURE = 'feature'
-PERFORMANCE = 'performance'
-RELIABILITY = 'reliability'
-MAINTENANCE = 'maintenance'
-
-fs_labeler = {
-    'b':BUG,
-    'f':FEATURE,
-    'p':PERFORMANCE,
-    'c':RELIABILITY,
-    'misc':MAINTENANCE,
-}
-
 def to_skip(token):
     return token in '={}<>()[]--' or '=' in token
 
@@ -49,7 +38,7 @@ def get_tokens(string, counter):
     return tokens
 
 def parse_patch(patch):
-    label = fs_labeler[patch['type']]
+    label = labeler.FS_LABELER[patch['type']]  # module-qualified: only `labeler` itself is imported above
     lines = patch['message'].splitlines()
     assert patch['subject'] == lines[0].strip()
     return label, lines