WorkCSV.py
3.82 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
#!/usr/bin/python
# -*- coding: utf-8 -*-
#Autor: Erickson Silva <erickson.silva@lavid.ufpb.br> <ericksonsilva@live.com>
import os, csv, sys
class WorkCSV(object):
    """Load the semicolon-delimited CSV lookup tables into dictionaries.

    Creating an instance reads five files from the data directory and fills
    one dictionary per file; the dictionaries are exposed through the
    ``getDic*`` accessors.  A file that cannot be opened is reported on
    standard output and its dictionary is simply left empty.

    All keys and values are stored as unicode text.  Data that is not valid
    UTF-8 is decoded as ISO-8859-1 instead.
    """

    def __init__(self):
        """Initialise the attributes and load every dictionary."""
        # Data directory; a relative path, so it is resolved against the
        # current working directory of the process.
        self.__path = "vlibras_user/vlibras-core/data/"
        # The __file* attributes are kept for compatibility only: readers
        # are no longer stored here, so every file can be closed right
        # after it has been read.
        self.__fileInf = ''
        self.__dicInf = {}
        self.__fileSin = ''
        self.__dicSin = {}
        self.__fileWords = ''
        self.__dicWords = {}
        self.__file2Gen = ''
        self.__dic2Gen = {}
        self.__fileTemVerbs = ''
        self.__dicTemVerbs = {}
        self.createDicInf()
        self.createDicSin()
        self.createDicWords()
        self.createDic2Gen()
        self.createDicTemVerbs()

    @staticmethod
    def __decode(values):
        """Return the byte strings in *values* decoded to unicode text.

        UTF-8 is tried first; if any value is not valid UTF-8, all values
        are decoded as ISO-8859-1 instead.
        """
        try:
            return [value.decode("utf-8") for value in values]
        except UnicodeDecodeError:
            # ISO-8859-1 maps every byte to a character, so this cannot fail.
            return [value.decode("iso8859-1") for value in values]

    def __readRows(self, fileName, caller):
        """Return the rows of *fileName* as lists of unicode cells.

        If the file cannot be opened, the I/O error and the name of the
        calling loader (*caller*) are printed and an empty list is returned.
        """
        try:
            handle = open(self.__path + fileName, "rb")
        except IOError as error:
            print("I/O error(%s): %s" % (error.errno, error.strerror))
            print(caller)
            return []
        # The context manager closes the file as soon as it has been read.
        with handle:
            if sys.version_info[0] < 3:
                # Python 2's csv module works on byte strings only:
                # parse first, decode each row afterwards.
                return [self.__decode(row)
                        for row in csv.reader(handle, delimiter=";")]
            # Python 3's csv module works on text only:
            # decode each line first, parse afterwards.
            lines = [self.__decode([line])[0] for line in handle]
            return list(csv.reader(lines, delimiter=";"))

    def __fillPairs(self, target, fileName, caller):
        """Map column 0 to column 1 in *target*, skipping empty values."""
        for row in self.__readRows(fileName, caller):
            # Blank or single-column lines have no value to map to.
            if len(row) > 1 and row[1] != "":
                target[row[0]] = row[1]

    def __fillIdentity(self, target, fileName, caller):
        """Map column 0 to itself in *target* for every non-blank row."""
        for row in self.__readRows(fileName, caller):
            # csv yields an empty list for a blank line; skip it.
            if row:
                target[row[0]] = row[0]

    def createDicInf(self):
        """Fill the infinitive-verb dictionary from ``dicPortGlosa.csv``."""
        self.__fillPairs(self.__dicInf, "dicPortGlosa.csv", "createDicInf")

    def createDicSin(self):
        """Fill the synonym dictionary from ``portuguesGlosa.csv``."""
        self.__fillPairs(self.__dicSin, "portuguesGlosa.csv", "createDicSin")

    def createDicTemVerbs(self):
        """Fill the verb-tense dictionary from ``temposVerbais.csv``."""
        self.__fillIdentity(self.__dicTemVerbs, "temposVerbais.csv",
                            "createDicTemVerbs")

    def createDicWords(self):
        """Fill the article/preposition dictionary from ``hWordsRemove.csv``."""
        self.__fillIdentity(self.__dicWords, "hWordsRemove.csv",
                            "createDicWords")

    def createDic2Gen(self):
        """Fill the common-gender noun dictionary from ``subs2Generos.csv``."""
        self.__fillIdentity(self.__dic2Gen, "subs2Generos.csv",
                            "createDic2Gen")

    def getDicInf(self):
        """Return the dictionary of verbs in the infinitive."""
        return self.__dicInf

    def getDicSin(self):
        """Return the dictionary of synonyms."""
        return self.__dicSin

    def getDicWords(self):
        """Return the dictionary of articles and prepositions to be removed."""
        return self.__dicWords

    def getDic2Gen(self):
        """Return the dictionary of nouns common to both genders."""
        return self.__dic2Gen

    def getDicTemVerbs(self):
        """Return the dictionary of verb tenses."""
        return self.__dicTemVerbs