gadict: comparison py/gadict.py

equal deleted inserted replaced

-:802f3f9c7ea6
+:b1f11eff7c70
 def __repr__(self):
     """Return a debug representation of the form ``<Headword X>``.

     ``X`` is ``self.headword`` rendered through ``str.format``.
     """
     template = "<Headword {}>"
     return template.format(self.headword)
 class Sense:
-def __init__(self, pos, tr_list = None, ex_list = None, glos_list = None, ant_list = None, syn_list = None, rel_list = None, topic_list = None, hyper_list = None, hypo_list = None, col_list = None):
+def __init__(self, pos, tr_list = None, ex_list = None, glos_list = None, ant_list = None, syn_list = None, rel_list = None, topic_list = None, hyper_list = None, hypo_list = None, col_list = None, countable = None):
 if not pos:
 raise ParseException("Part of speech expected...\n")
 self.pos = pos
 self.tr_list = tr_list
 self.ex_list = ex_list
 self.rel_list = rel_list
 self.topic_list = topic_list
 self.hyper_list = hyper_list
 self.hypo_list = hypo_list
 self.col_list = col_list
+self.countable = countable
 def add_tr(self, tr):
 if self.tr_list:
 self.tr_list.append(tr)
 else:
 def add_col(self, col):
 if self.col_list:
 self.col_list.append(col)
 else:
 self.col_list = [col]
+def set_countable(self, countable):
+if isinstance(countable, str):
+if countable == 'yes':
+self.countable = True
+elif countable == 'no':
+self.countable = False
+else:
+raise ParseException("Countable can only be yes/no.")
+elif isinstance(countable, bool):
+self.countable = countable
+else:
+raise ParseException("Countable can only be yes/no or bool.")
 def __str__(self):
 if tr_list:
 (lang, text) = self.tr_list[0]
 return "{}: {}".format(lang, text)
 # Line-level patterns; each one is anchored with ^...$ and so must match a whole line.
 # Indented "homo: <value>" line; the value starts and ends with a word character
 # and may contain "-", "'", spaces and ";" in between.
 HEADWORD_HOMO_RE = re.compile(u"^ +homo: (\\w|\\w[-'\\w ;]*\\w)$", re.UNICODE)
 # A line consisting of exactly one of the listed part-of-speech tags (no capture group).
 TRANSL_POS_RE = re.compile(u"^(?:n|det|pron|adj|v|adv|prep|conj|num|int|phr|phr\\.v|contr|abbr|prefix)$", re.UNICODE)
 # "<lang>: <text>" with lang in ru/uk/la/en; the text starts with a word character or "(".
 TRANSL_RE = re.compile(u"^(ru|uk|la|en): ([\\w(].*)$", re.UNICODE)
 # "<lang>> <text>"; the text starts with "-", "'", '"' or a word character.
 # NOTE(review): presumably a usage example for the translation -- confirm.
 TRANSL_EX_RE = re.compile(u"""^(ru|uk|la|en)> ([-'"\\w].*)$""", re.UNICODE)
 # "<lang>= <text>"; the text starts with "-", a word character or a digit.
 # NOTE(review): presumably a gloss/explanation line -- confirm.
 TRANSL_GLOS_RE = re.compile(u"^(ru|uk|la|en)= ([-\\w\\d].*)$", re.UNICODE)
 # Exactly "cnt: yes" or "cnt: no"; group 1 is the yes/no value.
+CNT_RE = re.compile(u"^cnt: (yes|no)$", re.UNICODE)
 # "<key>: <value>" lines for the keys topic/syn/ant/rel/hyper; group 1 is the
 # value, which must start with a word character.
 TOPIC_RE = re.compile(u"^topic: (\\w.*)$", re.UNICODE)
 SYN_RE = re.compile(u"^syn: (\\w.*)$", re.UNICODE)
 ANT_RE = re.compile(u"^ant: (\\w.*)$", re.UNICODE)
 REL_RE = re.compile(u"^rel: (\\w.*)$", re.UNICODE)
 HYPER_RE = re.compile(u"^hyper: (\\w.*)$", re.UNICODE)
 pos = m.group(0)
 sense = Sense(pos)
 continue
 if not sense:
 raise ParseException("""Missing part of speech marker...""")
+m = self.CNT_RE.match(self.line)
+if m is not None:
+sense.set_countable(m.group(1))
+continue
 m = self.TOPIC_RE.match(self.line)
 if m is not None:
 topics = m.group(1).split(";")
 for topic in topics:
 topic = topic.strip()

changeset 1006	b1f11eff7c70
parent 984	73d6e2631338
child 1011	fdf5640f221a