diff --git a/data/adverbiosIntensidade.csv b/data/adverbiosIntensidade.csv new file mode 100644 index 0000000..1c08075 --- /dev/null +++ b/data/adverbiosIntensidade.csv @@ -0,0 +1,6 @@ +muito;muito +demais;muito +pouco;pouco +menos;pouco +melhor;muito +pior;pouco \ No newline at end of file diff --git a/data/artigos.csv b/data/artigos.csv new file mode 100644 index 0000000..ab5b985 --- /dev/null +++ b/data/artigos.csv @@ -0,0 +1,8 @@ +a +as +o +os +um +uns +uma +umas \ No newline at end of file diff --git a/data/preposicoes.csv b/data/preposicoes.csv new file mode 100644 index 0000000..a44bb50 --- /dev/null +++ b/data/preposicoes.csv @@ -0,0 +1,18 @@ +em +na +no +nos +nas +de +da +do +dos +das +por +pelo +pela +pelos +pelas +para +ao +aos \ No newline at end of file diff --git a/data/regras.xml b/data/regras.xml index c680c63..6904846 100644 --- a/data/regras.xml +++ b/data/regras.xml @@ -381,7 +381,7 @@ 1 - + true 1 diff --git a/data/verbosLigacao.csv b/data/verbosLigacao.csv new file mode 100644 index 0000000..064bfcf --- /dev/null +++ b/data/verbosLigacao.csv @@ -0,0 +1,2 @@ +ser +estar \ No newline at end of file diff --git a/src/new/LerDicionarios.py b/src/new/LerDicionarios.py index 75da0f5..357c503 100644 --- a/src/new/LerDicionarios.py +++ b/src/new/LerDicionarios.py @@ -14,7 +14,7 @@ class LerDicionarios(object): def __init__(self): self.path = self.get_path() - self.dic_adv_intensidade = [] + self.dic_adv_intensidade = {} self.dic_adv_tempo = [] self.dic_art = [] self.dic_prep = [] @@ -42,15 +42,14 @@ class LerDicionarios(object): def carregar_adverbios_intensidade(self): try: - self.file = csv.reader(open(self.path+"adverbiosIntensidade.csv")) + self.file = csv.reader(open(self.path+"adverbiosIntensidade.csv"), delimiter=";") except IOError, (errno, strerror): print "I/O error(%s): %s" % (errno, strerror) print "carregar_adverbios_intensidade" - - rows = [] + for row in self.file: - rows.append(row[0].decode("utf-8")) - self.dic_adv_intensidade = set(rows) + if row[1] != "": + self.dic_adv_intensidade[row[0].decode("utf-8")] = row[1].decode("utf-8") def carregar_adverbios_tempo(self): try: @@ -135,7 +134,7 @@ class LerDicionarios(object): self.dic_vb_ligacao = set(rows) def has_adverbio_intensidade(self, token): - return token in self.dic_adv_intensidade + return self.dic_adv_intensidade.has_key(token) def has_adverbio_tempo(self, token): return token in self.dic_adv_tempo @@ -158,6 +157,9 @@ class LerDicionarios(object): def has_verbo_ligacao(self, token): return token in self.dic_vb_ligacao + def get_adverbio_intensidade(self, token): + return self.dic_adv_intensidade[token] + def get_sinonimo(self, token): return self.dic_sin[token] -- libgit2 0.21.2