@@ -63,72 +63,7 @@ def finalize(self):
63
63
pass
64
64
65
65
def process_tu(self, tu, num_of_finished_scans):
    """Score one translation unit during a scan.

    Delegates the counting to ``self.find_mismatches(tu)`` and turns the
    resulting number of mismatching categories into a one-element list.

    Args:
        tu: Translation unit; handed to ``find_mismatches`` unchanged.
        num_of_finished_scans: Not used by this method; kept so the
            signature stays the same for callers.

    Returns:
        ``[0]`` when more than one category mismatches, ``[1]`` otherwise.
    """
    minus_points = self.find_mismatches(tu)

    # A single mismatching category is tolerated; two or more are not.
    if minus_points > 1:
        return [0]
    return [1]
@@ -137,14 +72,19 @@ def do_after_a_full_scan(self, num_of_finished_scans):
137
72
pass
138
73
139
74
def decide(self, tu):
    """Return the accept/reject verdict for one translation unit.

    Delegates the counting to ``self.find_mismatches(tu)``.

    Args:
        tu: Translation unit; handed to ``find_mismatches`` unchanged.

    Returns:
        ``'reject'`` when more than one category mismatches,
        ``'accept'`` otherwise.
    """
    minus_points = self.find_mismatches(tu)

    # Same tolerance as process_tu: one mismatching category is allowed.
    if minus_points > 1:
        return 'reject'
    return 'accept'
80
+
81
def find_mismatches(self, tu):
    """Count the categories whose occurrences differ between source and target.

    For each pattern, the number of matches in ``tu.src_phrase`` is compared
    with the number of matches in ``tu.trg_phrase``; every category whose
    counts differ adds one point.

    Side effect: dates and reference tags are removed from both
    ``tu.src_phrase`` and ``tu.trg_phrase`` right after their own check, so
    the later patterns run on the stripped text and the caller's ``tu`` is
    left modified.
    NOTE(review): confirm that callers rely on this in-place stripping.

    Args:
        tu: Object with string attributes ``src_phrase`` and ``trg_phrase``.

    Returns:
        Number of categories (0 to 8) with differing match counts.
    """
    # Order matters: each entry is (compiled pattern, strip matches afterwards).
    # Dates are stripped before numbers are counted, and reference tags
    # before the XML check.
    checks = (
        (self.date_re, True),        # Dates
        (self.num_re, False),        # Numbers
        (self.ref_re, True),         # Reference tags
        (self.xml_re, False),        # XML tags
        (self.email_re, False),      # Emails
        (self.url_re, False),        # URLs
        (self.image_re, False),      # Image tags
        (self.category_re, False),   # Category tags
    )

    minus_points = 0
    for pattern, strip_after in checks:
        src_count = len(pattern.findall(tu.src_phrase))
        trg_count = len(pattern.findall(tu.trg_phrase))
        if src_count != trg_count:
            minus_points += 1

        if strip_after:
            tu.src_phrase = pattern.sub("", tu.src_phrase)
            tu.trg_phrase = pattern.sub("", tu.trg_phrase)

    return minus_points
0 commit comments