class StanfordSyntacticContexts: def __init__(self, input_folder, temp_folder, stoplist_file, min_word_size, record_intermediate): try: self.root, self.dirs, self.files = os.walk(input_folder).next()[:3] except IOError: print bcolors.FAIL + 'ERROR: It was not possible to open the ' + input_folder + ' folder' + bcolors.ENDC sys.exit(2) self.min_word_size = int(min_word_size) self.temp_folder = temp_folder self.qty_documents = len(self.files) self.misc = Miscelaneous() self.stoplist = self.misc.getStoplist(stoplist_file) self.matrix_relations = ['AN', 'SV', 'VO'] self.dic_an = {} self.dic_sv = {} self.dic_vo = {} command = 'rm -Rf ' + self.temp_folder + '; mkdir ' + self.temp_folder + ' ' if record_intermediate: command += self.temp_folder + 'AN/' + ' ' + self.temp_folder + 'AN/2Order/' + self.temp_folder + 'AN/3Order/ ' command += self.temp_folder + 'SV/' + ' ' + self.temp_folder + 'SV/2Order/' + self.temp_folder + 'SV/3Order/ ' command += self.temp_folder + 'VO/' + ' ' + self.temp_folder + 'VO/2Order/' + self.temp_folder + 'VO/3Order/ ' os.system(command) i = 0 for corpus_file in self.files: self.dic_t = {} self.dic_nt = {} self.dic_an_doc = {} self.dic_sv_doc = {} self.dic_vo_doc = {} #print corpus_file i += 1 if re.match('.*xml$', corpus_file): corpus_filename = corpus_file.split('.')[0] xml = ParseStanfordXml(self.root + '' + corpus_file) self.dic_t = xml.getDicTerms() self.dic_nt = xml.getDicNonTerminals() self.__extractRelations__() if record_intermediate: self.__writeDicRelations__(corpus_filename) self.misc.progress_bar(i, self.qty_documents, 100) self.__writeDic__() def __del__(self): pass def __extractRelations__(self): i = 0 #print self.dic_t for id_nt in self.dic_nt: if self.dic_nt[id_nt]['cat'] == 'nn': noun = self.dic_t[self.dic_nt[id_nt]['gov']]['lemma'].lower() #noun = re.sub('-', '_', noun) context = self.dic_t[self.dic_nt[id_nt] ['dep']]['lemma'].lower() context = re.sub('-', '_', context) if len(noun) >= self.min_word_size and len( context) >= 
self.min_word_size: self.__addElementDicAN__(context + '#' + noun) self.__addElementDicAN__(noun + '#' + context) self.__addElementDicDocAN__(context + '#' + noun) self.__addElementDicDocAN__(noun + '#' + context) elif self.dic_nt[id_nt]['cat'] == 'amod': noun = self.dic_t[self.dic_nt[id_nt]['gov']]['lemma'].lower() #noun = re.sub('-', '_', noun) context = self.dic_t[self.dic_nt[id_nt] ['dep']]['lemma'].lower() context = re.sub('-', '_', context) if len(noun) >= self.min_word_size and len( context ) >= self.min_word_size and context not in self.stoplist: self.__addElementDicAN__(context + '#' + noun) self.__addElementDicDocAN__(context + '#' + noun) if re.match('prep_', self.dic_nt[id_nt]['cat']) \ and re.match('^NN', self.dic_t[self.dic_nt[id_nt]['dep']]['pos']) \ and re.match('^NN', self.dic_t[self.dic_nt[id_nt]['gov']]['pos']): noun = self.dic_t[self.dic_nt[id_nt]['gov']]['lemma'].lower() #noun = re.sub('-', '_', noun) context = self.dic_t[self.dic_nt[id_nt] ['dep']]['lemma'].lower() context = re.sub('-', '_', context) prep = self.dic_nt[id_nt]['cat'].split('_')[1] if len(noun) >= self.min_word_size and len( context) >= self.min_word_size: self.__addElementDicAN__(prep + '_' + context + '#' + noun) self.__addElementDicAN__(prep + '_' + noun + '#' + context) self.__addElementDicDocAN__(prep + '_' + context + '#' + noun) self.__addElementDicDocAN__(prep + '_' + noun + '#' + context) elif re.match('^(nsubjpass|nsubj|xsubj|agent)$', self.dic_nt[id_nt]['cat']): #gov = verb if re.match('V', self.dic_t[self.dic_nt[id_nt]['gov']]['pos']): verb = self.dic_t[self.dic_nt[id_nt] ['gov']]['lemma'].lower() #verb = re.sub('-', '_', verb) contexts = self.dic_t[self.dic_nt[id_nt]['dep']]['nps'] for context in contexts: if len(verb) >= self.min_word_size and len( context) >= self.min_word_size: self.__addElementDicSV__('sub_' + verb + '#' + context) self.__addElementDicDocSV__('sub_' + verb + '#' + context) elif re.match('^(dobj|iobj)$', self.dic_nt[id_nt]['cat']): if 
re.match('V', self.dic_t[self.dic_nt[id_nt]['gov']]['pos']): verb = self.dic_t[self.dic_nt[id_nt] ['gov']]['lemma'].lower() #verb = re.sub('-', '_', verb) contexts = self.dic_t[self.dic_nt[id_nt]['dep']]['nps'] for context in contexts: if len(verb) >= self.min_word_size and len( context) >= self.min_word_size: self.__addElementDicVO__('obj_' + verb + '#' + context) self.__addElementDicDocVO__('obj_' + verb + '#' + context) def __addElementDicAN__(self, relation): if self.dic_an.has_key(relation): self.dic_an[relation] += 1 else: self.dic_an[relation] = 1 def __addElementDicDocAN__(self, relation): if self.dic_an_doc.has_key(relation): self.dic_an_doc[relation] += 1 else: self.dic_an_doc[relation] = 1 def __addElementDicSV__(self, relation): if self.dic_sv.has_key(relation): self.dic_sv[relation] += 1 else: self.dic_sv[relation] = 1 def __addElementDicDocSV__(self, relation): if self.dic_sv_doc.has_key(relation): self.dic_sv_doc[relation] += 1 else: self.dic_sv_doc[relation] = 1 def __addElementDicVO__(self, relation): if self.dic_vo.has_key(relation): self.dic_vo[relation] += 1 else: self.dic_vo[relation] = 1 def __addElementDicDocVO__(self, relation): if self.dic_vo_doc.has_key(relation): self.dic_vo_doc[relation] += 1 else: self.dic_vo_doc[relation] = 1 def __writeDicRelations__(self, corpus_filename): file_relation_an = self.misc.openFile( self.temp_folder + 'AN/2Order/AN_' + corpus_filename + '.txt', 'w') for id_relation in self.dic_an_doc: file_relation_an.write(id_relation + '#' + str(self.dic_an_doc[id_relation]) + '\n') file_relation_an.close() file_relation_sv = self.misc.openFile( self.temp_folder + 'SV/2Order/SV_' + corpus_filename + '.txt', 'w') for id_relation in self.dic_sv_doc: file_relation_sv.write(id_relation + '#' + str(self.dic_sv_doc[id_relation]) + '\n') file_relation_sv.close() file_relation_vo = self.misc.openFile( self.temp_folder + 'VO/2Order/VO_' + corpus_filename + '.txt', 'w') for id_relation in self.dic_vo_doc: 
file_relation_vo.write(id_relation + '#' + str(self.dic_vo_doc[id_relation]) + '\n') file_relation_vo.close() def __writeDic__(self): for type_relation in self.matrix_relations: file_relation = self.misc.openFile( self.temp_folder + '' + type_relation + '/2Order/Relations.txt', 'w') dic_relation = self.getDic(type_relation) for id_relation in dic_relation: file_relation.write(id_relation + '#' + str(dic_relation[id_relation]) + '\n') file_relation.close() """ Get and Print methods """ def getDic(self, type_relation): if type_relation == 'AN': return self.dic_an elif type_relation == 'SV': return self.dic_sv elif type_relation == 'VO': return self.dic_vo def printDic(self, type_relation): dic_relation = getDic(type_relation) for id_relation in self.dic_relation: print id_relation + ' = ' + str(self.dic_relation[id_relation])
def __buildDics__(self, filename):
    # Parse one Stanford CoreNLP XML output file line by line and fill
    #   self.dic_t  -- token id ("s<sent>_<tok>") -> {word, lemma, pos, ner, nps}
    #   self.dic_nt -- dependency id -> {cat, gov, dep}
    # then derive multi-word noun phrases and attach them to tokens' "nps".
    # NOTE(review): assumes self.dic_t / self.dic_nt already exist on self,
    # and that the XML follows the exact CoreNLP layout -- the string
    # splitting below is not a real XML parser; verify against callers.
    misc = Miscelaneous()
    xmlfile = misc.openFile(filename, "r")
    self.stoplist = misc.getStoplist("../misc/stoplist.txt")
    record_dependencies = False  # inside <basic-dependencies>
    record_collapsed = False     # inside <collapsed-ccprocessed-dependencies>
    for line in xmlfile:
        line = re.sub("\n", "", line)
        if "<sentence " in line:
            # New sentence: remember its id and reset the per-sentence list
            # of dependencies already recorded (deduplication).
            id_s = (line.split('id="')[1]).split('"')[0]
            array_rec_dep = []
        elif "<token " in line:
            # Token ids are namespaced by sentence: "s<sent>_<tok>".
            id_t = "s" + id_s + "_" + (line.split('id="')[1]).split('"')[0]
        elif "<word>" in line:
            word = (line.split("<word>")[1]).split("</word>")[0]
        elif "<lemma>" in line:
            lemma = (line.split("<lemma>")[1]).split("</lemma>")[0]
        elif "<POS>" in line:
            pos = (line.split("<POS>")[1]).split("</POS>")[0]
        elif "<NER>" in line:
            ner = (line.split("<NER>")[1]).split("</NER>")[0]
        elif "</token>" in line:
            # Token complete: store it.  Nouns seed their own "nps" list
            # with the lowercased lemma.
            self.dic_t[id_t] = {"word": word, "lemma": lemma, "pos": pos,
                                "ner": ner, "nps": []}
            if re.match("NN|NNP", pos):
                array_nps = [lemma.lower()]
                self.dic_t[id_t]["nps"] = array_nps
        elif "<basic-dependencies>" in line:
            record_dependencies = True
            # Dependency ids start at 500, presumably to avoid colliding
            # with token indices in the same sentence namespace -- confirm.
            index_nt = 500
        elif "</basic-dependencies>" in line:
            record_dependencies = False
        elif "<collapsed-ccprocessed-dependencies>" in line:
            record_collapsed = True
        elif "</collapsed-ccprocessed-dependencies>" in line:
            record_collapsed = False
        if record_dependencies or record_collapsed:
            if "<dep type=" in line:
                cat = (line.split('type="')[1]).split('"')[0]
            elif "<governor " in line:
                idx_gov = (line.split('idx="')[1]).split('"')[0]
                id_t_gov = "s" + id_s + "_" + idx_gov
            elif "<dependent " in line:
                idx_dep = (line.split('idx="')[1]).split('"')[0]
                id_t_dep = "s" + id_s + "_" + idx_dep
            # NOTE(review): the repeated flag test below is redundant --
            # we are already inside the record_* guard.
            elif (record_dependencies or record_collapsed) and "</dep>" in line:
                # Dependency complete: record it once per sentence.
                if cat + "#" + id_t_gov + "#" + id_t_dep not in array_rec_dep:
                    array_rec_dep.append(cat + "#" + id_t_gov + "#" + id_t_dep)
                    self.dic_nt["s" + id_s + "_" + str(index_nt)] = {
                        "cat": cat, "gov": id_t_gov, "dep": id_t_dep}
                    index_nt += 1
    xmlfile.close()
    # Second pass: build multi-word noun phrases from nn/amod chains and
    # "X of Y" constructions, appending them to the relevant tokens' nps.
    for id_nt in self.dic_nt:
        if re.match("(nn|amod)", self.dic_nt[id_nt]["cat"]):
            array_nps = self.dic_t[self.dic_nt[id_nt]["gov"]]["nps"]
            string = ""
            id_gov = self.dic_nt[id_nt]["gov"].split("_")[1]
            id_dep = self.dic_nt[id_nt]["dep"].split("_")[1]
            id_s = self.dic_nt[id_nt]["dep"].split("_")[0]
            # Concatenate every non-stoplist NN/JJ lemma between dependent
            # and governor (assumes the dependent precedes the governor in
            # token order -- TODO confirm for all nn/amod parses).
            for i in range(int(id_dep), int(id_gov)):
                id_next = id_s + "_" + str(i)
                if (
                    re.match("(NN|JJ)", self.dic_t[id_next]["pos"])
                    and self.dic_t[id_next]["lemma"] not in self.stoplist
                ):
                    string += self.dic_t[id_next]["lemma"] + "_"
            string += self.dic_t[id_s + "_" + id_gov]["lemma"]
            # Only keep genuinely multi-word phrases, once each.
            if len(string.split("_")) > 1 and string.lower() not in array_nps:
                array_nps.append(string.lower())
                self.dic_t[self.dic_nt[id_nt]["gov"]]["nps"] = array_nps
        elif re.match("prep_of", self.dic_nt[id_nt]["cat"]):
            id_gov = self.dic_nt[id_nt]["gov"]
            id_dep = self.dic_nt[id_nt]["dep"]
            if re.match("NN", self.dic_t[id_dep]["pos"]) and re.match("NN", self.dic_t[id_gov]["pos"]):
                # "<gov>_of_<dep>" is attached to BOTH tokens' nps lists.
                array_nps = self.dic_t[id_dep]["nps"]
                string = self.dic_t[id_gov]["lemma"] + "_of_" + self.dic_t[id_dep]["lemma"]
                array_nps.append(string.lower())
                self.dic_t[self.dic_nt[id_nt]["dep"]]["nps"] = array_nps
                array_nps = self.dic_t[id_gov]["nps"]
                string = self.dic_t[id_gov]["lemma"] + "_of_" + self.dic_t[id_dep]["lemma"]
                array_nps.append(string.lower())
                self.dic_t[self.dic_nt[id_nt]["gov"]]["nps"] = array_nps
def __buildDics__(self, filename):
    """Populate self.dic_t (tokens) and self.dic_nt (dependencies) from one
    Stanford CoreNLP XML file, then attach noun-phrase strings to tokens.
    """
    def _attr(text, marker):
        # Value of the attribute introduced by `marker` up to the closing
        # double quote, e.g. _attr(line, 'id="').
        return (text.split(marker)[1]).split('"')[0]

    def _elem(text, tag):
        # Text enclosed between <tag> and </tag>.
        return (text.split('<%s>' % tag)[1]).split('</%s>' % tag)[0]

    helper = Miscelaneous()
    handle = helper.openFile(filename, 'r')
    self.stoplist = helper.getStoplist('../misc/stoplist.txt')
    in_basic = False      # inside <basic-dependencies>
    in_collapsed = False  # inside <collapsed-ccprocessed-dependencies>
    for raw in handle:
        raw = re.sub('\n', '', raw)
        if '<sentence ' in raw:
            # New sentence: remember its id, reset dedup list.
            sent_id = _attr(raw, 'id="')
            seen_deps = []
        elif '<token ' in raw:
            # Tokens are keyed "s<sentence>_<token>".
            tok_id = 's' + sent_id + '_' + _attr(raw, 'id="')
        elif '<word>' in raw:
            word = _elem(raw, 'word')
        elif '<lemma>' in raw:
            lemma = _elem(raw, 'lemma')
        elif '<POS>' in raw:
            pos = _elem(raw, 'POS')
        elif '<NER>' in raw:
            ner = _elem(raw, 'NER')
        elif '</token>' in raw:
            # Token finished: store it; nouns seed 'nps' with their lemma.
            entry = {'word': word, 'lemma': lemma, 'pos': pos,
                     'ner': ner, 'nps': []}
            if re.match('NN|NNP', pos):
                entry['nps'] = [lemma.lower()]
            self.dic_t[tok_id] = entry
        elif '<basic-dependencies>' in raw:
            in_basic = True
            dep_counter = 500  # dependency ids start at 500
        elif '</basic-dependencies>' in raw:
            in_basic = False
        elif '<collapsed-ccprocessed-dependencies>' in raw:
            in_collapsed = True
        elif '</collapsed-ccprocessed-dependencies>' in raw:
            in_collapsed = False
        if in_basic or in_collapsed:
            if '<dep type=' in raw:
                cat = _attr(raw, 'type="')
            elif '<governor ' in raw:
                gov_id = 's' + sent_id + '_' + _attr(raw, 'idx="')
            elif '<dependent ' in raw:
                dep_id = 's' + sent_id + '_' + _attr(raw, 'idx="')
            elif '</dep>' in raw:
                # Record each (cat, gov, dep) triple once per sentence.
                key = cat + '#' + gov_id + '#' + dep_id
                if key not in seen_deps:
                    seen_deps.append(key)
                    self.dic_nt['s' + sent_id + '_' + str(dep_counter)] = {
                        'cat': cat, 'gov': gov_id, 'dep': dep_id}
                    dep_counter += 1
    handle.close()
    # Second pass: derive multi-word noun phrases and append them to nps.
    for nt_key in self.dic_nt:
        link = self.dic_nt[nt_key]
        if re.match("(nn|amod)", link['cat']):
            nps = self.dic_t[link['gov']]['nps']
            compound = ''
            gov_idx = link['gov'].split('_')[1]
            dep_idx = link['dep'].split('_')[1]
            sent = link['dep'].split('_')[0]
            # Glue together the NN/JJ lemmas between dependent and governor.
            for position in range(int(dep_idx), int(gov_idx)):
                tok = self.dic_t[sent + '_' + str(position)]
                if re.match("(NN|JJ)", tok['pos']) and tok['lemma'] not in self.stoplist:
                    compound += tok['lemma'] + '_'
            compound += self.dic_t[sent + '_' + gov_idx]['lemma']
            # Keep only genuinely multi-word phrases, once each.
            if len(compound.split('_')) > 1 and compound.lower() not in nps:
                nps.append(compound.lower())
                self.dic_t[link['gov']]['nps'] = nps
        elif re.match("prep_of", link['cat']):
            gov_key = link['gov']
            dep_key = link['dep']
            if re.match("NN", self.dic_t[dep_key]['pos']) and re.match("NN", self.dic_t[gov_key]['pos']):
                # "<gov>_of_<dep>" goes onto BOTH tokens' nps lists.
                phrase = self.dic_t[gov_key]['lemma'] + '_of_' + self.dic_t[dep_key]['lemma']
                self.dic_t[dep_key]['nps'].append(phrase.lower())
                self.dic_t[gov_key]['nps'].append(phrase.lower())
class StanfordSyntacticContexts:
    """Extract AN (noun modifier), SV (subject-verb) and VO (verb-object)
    relation counts from a folder of Stanford-parser XML files, writing
    'relation#count' files under temp_folder.

    Python 2 code (print statements, iterator .next()).
    """

    def __init__(self, input_folder, temp_folder, stoplist_file, min_word_size, record_intermediate):
        try:
            # First os.walk() triple: (root, sub-dirs, files) of input_folder.
            # NOTE(review): a missing folder raises StopIteration here, not
            # IOError, so the error branch below is effectively unreachable.
            self.root, self.dirs, self.files = os.walk(input_folder).next()[:3]
        except IOError:
            print bcolors.FAIL+'ERROR: It was not possible to open the '+input_folder+' folder'+bcolors.ENDC
            sys.exit(2)
        self.min_word_size = int(min_word_size)
        self.temp_folder = temp_folder
        self.qty_documents = len(self.files)  # for the progress bar
        self.misc = Miscelaneous()
        self.stoplist = self.misc.getStoplist(stoplist_file)
        self.matrix_relations = ['AN', 'SV', 'VO']
        self.dic_an = {}  # corpus-wide AN counts
        self.dic_sv = {}  # corpus-wide SV counts
        self.dic_vo = {}  # corpus-wide VO counts
        # Recreate the temp folder tree via the shell.
        # NOTE(review): temp_folder is interpolated unquoted into a shell
        # string, and the '+=' lines below are missing ' ' separators
        # between the '2Order/' and the following path, fusing two paths
        # into one bogus mkdir argument (3Order dirs are never created).
        command = 'rm -Rf '+self.temp_folder+'; mkdir '+self.temp_folder+' '
        if record_intermediate:
            command += self.temp_folder+'AN/'+' '+self.temp_folder+'AN/2Order/'+self.temp_folder+'AN/3Order/ '
            command += self.temp_folder+'SV/'+' '+self.temp_folder+'SV/2Order/'+self.temp_folder+'SV/3Order/ '
            command += self.temp_folder+'VO/'+' '+self.temp_folder+'VO/2Order/'+self.temp_folder+'VO/3Order/ '
        os.system(command)
        i = 0
        for corpus_file in self.files:
            # Per-document state, reset for every corpus file.
            self.dic_t = {}
            self.dic_nt = {}
            self.dic_an_doc = {}
            self.dic_sv_doc = {}
            self.dic_vo_doc = {}
            #print corpus_file
            i += 1
            if re.match('.*xml$', corpus_file):
                corpus_filename = corpus_file.split('.')[0]
                # NOTE(review): root and file name are joined with no '/',
                # so this only works if input_folder ends with a slash.
                xml = ParseStanfordXml(self.root+''+corpus_file)
                self.dic_t = xml.getDicTerms()
                self.dic_nt = xml.getDicNonTerminals()
                self.__extractRelations__()
                if record_intermediate:
                    self.__writeDicRelations__(corpus_filename)
            self.misc.progress_bar(i, self.qty_documents, 100)
        self.__writeDic__()

    def __del__(self):
        # Nothing to release; kept for interface compatibility.
        pass

    def __extractRelations__(self):
        # Walk every dependency in self.dic_nt and count AN / SV / VO
        # relations, both corpus-wide and per-document.
        i = 0
        #print self.dic_t
        for id_nt in self.dic_nt:
            if self.dic_nt[id_nt]['cat'] == 'nn':
                # Noun compound: count both orderings of the pair.
                noun = self.dic_t[self.dic_nt[id_nt]['gov']]['lemma'].lower()
                #noun = re.sub('-', '_', noun)
                context = self.dic_t[self.dic_nt[id_nt]['dep']]['lemma'].lower()
                context = re.sub('-', '_', context)
                if len(noun) >= self.min_word_size and len(context) >= self.min_word_size:
                    self.__addElementDicAN__(context+'#'+noun)
                    self.__addElementDicAN__(noun+'#'+context)
                    self.__addElementDicDocAN__(context+'#'+noun)
                    self.__addElementDicDocAN__(noun+'#'+context)
            elif self.dic_nt[id_nt]['cat'] == 'amod':
                # Adjectival modifier: adjective acts as the noun's context.
                noun = self.dic_t[self.dic_nt[id_nt]['gov']]['lemma'].lower()
                #noun = re.sub('-', '_', noun)
                context = self.dic_t[self.dic_nt[id_nt]['dep']]['lemma'].lower()
                context = re.sub('-', '_', context)
                if len(noun) >= self.min_word_size and len(context) >= self.min_word_size and context not in self.stoplist:
                    self.__addElementDicAN__(context+'#'+noun)
                    self.__addElementDicDocAN__(context+'#'+noun)
            # Deliberately a fresh 'if' (not elif): a 'prep_*' relation is
            # tested even after the nn/amod chain above has run.
            if re.match('prep_', self.dic_nt[id_nt]['cat']) \
                and re.match('^NN', self.dic_t[self.dic_nt[id_nt]['dep']]['pos']) \
                and re.match('^NN', self.dic_t[self.dic_nt[id_nt]['gov']]['pos']):
                # Noun-preposition-noun link, e.g. prep_of -> 'of_x#y'.
                noun = self.dic_t[self.dic_nt[id_nt]['gov']]['lemma'].lower()
                #noun = re.sub('-', '_', noun)
                context = self.dic_t[self.dic_nt[id_nt]['dep']]['lemma'].lower()
                context = re.sub('-', '_', context)
                prep = self.dic_nt[id_nt]['cat'].split('_')[1]
                if len(noun) >= self.min_word_size and len(context) >= self.min_word_size:
                    self.__addElementDicAN__(prep+'_'+context+'#'+noun)
                    self.__addElementDicAN__(prep+'_'+noun+'#'+context)
                    self.__addElementDicDocAN__(prep+'_'+context+'#'+noun)
                    self.__addElementDicDocAN__(prep+'_'+noun+'#'+context)
            elif re.match('^(nsubjpass|nsubj|xsubj|agent)$', self.dic_nt[id_nt]['cat']):
                #gov = verb
                # Subject-verb: governor is the verb, dependent the subject;
                # every noun phrase attached to the subject token counts.
                if re.match('V', self.dic_t[self.dic_nt[id_nt]['gov']]['pos']):
                    verb = self.dic_t[self.dic_nt[id_nt]['gov']]['lemma'].lower()
                    #verb = re.sub('-', '_', verb)
                    contexts = self.dic_t[self.dic_nt[id_nt]['dep']]['nps']
                    for context in contexts:
                        if len(verb) >= self.min_word_size and len(context) >= self.min_word_size:
                            self.__addElementDicSV__('sub_'+verb+'#'+context)
                            self.__addElementDicDocSV__('sub_'+verb+'#'+context)
            elif re.match('^(dobj|iobj)$', self.dic_nt[id_nt]['cat']):
                # Verb-object: same pattern with the object's noun phrases.
                if re.match('V', self.dic_t[self.dic_nt[id_nt]['gov']]['pos']):
                    verb = self.dic_t[self.dic_nt[id_nt]['gov']]['lemma'].lower()
                    #verb = re.sub('-', '_', verb)
                    contexts = self.dic_t[self.dic_nt[id_nt]['dep']]['nps']
                    for context in contexts:
                        if len(verb) >= self.min_word_size and len(context) >= self.min_word_size:
                            self.__addElementDicVO__('obj_'+verb+'#'+context)
                            self.__addElementDicDocVO__('obj_'+verb+'#'+context)

    def __addElementDicAN__(self, relation):
        # Increment the corpus-wide AN count for this relation.
        if self.dic_an.has_key(relation):
            self.dic_an[relation] += 1
        else:
            self.dic_an[relation] = 1

    def __addElementDicDocAN__(self, relation):
        # Increment the per-document AN count for this relation.
        if self.dic_an_doc.has_key(relation):
            self.dic_an_doc[relation] += 1
        else:
            self.dic_an_doc[relation] = 1

    def __addElementDicSV__(self, relation):
        # Increment the corpus-wide SV count for this relation.
        if self.dic_sv.has_key(relation):
            self.dic_sv[relation] += 1
        else:
            self.dic_sv[relation] = 1

    def __addElementDicDocSV__(self, relation):
        # Increment the per-document SV count for this relation.
        if self.dic_sv_doc.has_key(relation):
            self.dic_sv_doc[relation] += 1
        else:
            self.dic_sv_doc[relation] = 1

    def __addElementDicVO__(self, relation):
        # Increment the corpus-wide VO count for this relation.
        if self.dic_vo.has_key(relation):
            self.dic_vo[relation] += 1
        else:
            self.dic_vo[relation] = 1

    def __addElementDicDocVO__(self, relation):
        # Increment the per-document VO count for this relation.
        if self.dic_vo_doc.has_key(relation):
            self.dic_vo_doc[relation] += 1
        else:
            self.dic_vo_doc[relation] = 1

    def __writeDicRelations__(self, corpus_filename):
        # Dump the per-document dictionaries for one corpus file, one
        # 'relation#count' line per entry.
        file_relation_an = self.misc.openFile(self.temp_folder+'AN/2Order/AN_'+corpus_filename+'.txt', 'w')
        for id_relation in self.dic_an_doc:
            file_relation_an.write(id_relation+'#'+str(self.dic_an_doc[id_relation])+'\n')
        file_relation_an.close()
        file_relation_sv = self.misc.openFile(self.temp_folder+'SV/2Order/SV_'+corpus_filename+'.txt', 'w')
        for id_relation in self.dic_sv_doc:
            file_relation_sv.write(id_relation+'#'+str(self.dic_sv_doc[id_relation])+'\n')
        file_relation_sv.close()
        file_relation_vo = self.misc.openFile(self.temp_folder+'VO/2Order/VO_'+corpus_filename+'.txt', 'w')
        for id_relation in self.dic_vo_doc:
            file_relation_vo.write(id_relation+'#'+str(self.dic_vo_doc[id_relation])+'\n')
        file_relation_vo.close()

    def __writeDic__(self):
        # Dump the corpus-wide dictionaries, one file per relation type.
        # NOTE(review): these directories are only created when
        # record_intermediate is true (see __init__), so this write can
        # fail otherwise -- confirm against Miscelaneous.openFile.
        for type_relation in self.matrix_relations:
            file_relation = self.misc.openFile(self.temp_folder+''+type_relation+'/2Order/Relations.txt', 'w')
            dic_relation = self.getDic(type_relation)
            for id_relation in dic_relation:
                file_relation.write(id_relation+'#'+str(dic_relation[id_relation])+'\n')
            file_relation.close()

    """
    Get and Print methods
    """

    def getDic(self, type_relation):
        # Return the corpus-wide dictionary for 'AN', 'SV' or 'VO'
        # (implicitly None for any other value).
        if type_relation == 'AN':
            return self.dic_an
        elif type_relation == 'SV':
            return self.dic_sv
        elif type_relation == 'VO':
            return self.dic_vo

    def printDic(self, type_relation):
        # NOTE(review): broken as written -- bare getDic() is a NameError
        # (should be self.getDic), and the loop reads the non-existent
        # attribute self.dic_relation instead of the local dic_relation.
        dic_relation = getDic(type_relation)
        for id_relation in self.dic_relation:
            print id_relation+' = '+str(self.dic_relation[id_relation])