import os

from sortedcontainers import SortedDict

import Contants  # project-local constants module (name spelled as in the source)
import Data      # project-local serialization helpers


def createPostingList(sortTepDic):
    # Map each term to the list of document IDs it occurs in.
    posting = {}
    for key in sortTepDic.keys():
        posting[key] = list(sortTepDic[key][0])
    Data.write_dataStruct_to_file(Contants.POSTING_LIST_FILE_NAME, posting)
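# Illustrative sketch (not part of the original module): given the index
# structure built by createTermIndex below, createPostingList keeps only the
# document IDs per term. The values here are made up for demonstration:
#
#   sortTepDic['apple'] == ({'doc1.txt': (3, 17), 'doc2.txt': (5,)}, 3, 2)
#   posting['apple']    == ['doc1.txt', 'doc2.txt']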
def createTermIndex():
    sortTepDic = SortedDict()
    # Structure for each term:
    # sortTepDic['term'] = ({'DocId1': ['Pos1', 'Pos2'], 'DocId2': ['Pos1', 'Pos2']}, 'termFreq', 'DocFreq')
    for root, dirs, files in os.walk(Contants.DATA_DIRECTORY_NAME, topdown=True):
        for name in files:
            file_name = os.path.join(root, name)
            DocId = os.path.split(file_name)[1]  # use the bare file name as the document ID
            # 'r' opens the file read-only; the 'with' block guarantees it is
            # closed again, even if an exception is raised while indexing.
            with open(file_name, 'r') as file_object:
                wordPos = 0
                for word in file_object.read().split():
                    wordPos = wordPos + 1  # increment the word position
                    lamma = applyFilters(word)
                    if lamma:
                        if lamma not in sortTepDic:
                            # add a new term: first document, first position,
                            # term frequency 1, document frequency 1
                            sortTepDic[lamma] = [{DocId: [wordPos]}, 1, 1]
                        else:
                            sortTepDic[lamma][1] = sortTepDic[lamma][1] + 1  # increment the term frequency
                            if DocId in sortTepDic[lamma][0]:
                                # add a new word position for the existing document
                                sortTepDic[lamma][0][DocId].append(wordPos)
                            else:
                                # add a new document ID with the word position and
                                # increment the document frequency
                                sortTepDic[lamma][0][DocId] = [wordPos]
                                sortTepDic[lamma][2] = sortTepDic[lamma][2] + 1
    # convert the lists to tuples so the stored index is immutable
    for key in sortTepDic.keys():
        for DocId in sortTepDic[key][0]:
            sortTepDic[key][0][DocId] = tuple(sortTepDic[key][0][DocId])
        sortTepDic[key] = tuple(sortTepDic[key])
    Data.write_dataStruct_to_file(Contants.WORD_INDEX_FILE_NAME, sortTepDic)
    createLexicon(sortTepDic)
    createPostingList(sortTepDic)
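# applyFilters() is called above but defined elsewhere in the project. A
# minimal stand-in, assuming it normalizes a raw token and returns the term
# to index, or a falsy value for tokens that should be skipped; the real
# version may also lemmatize (the 'lamma' variable suggests lemmatization).
import string

_STOPWORDS = {'a', 'an', 'and', 'are', 'is', 'of', 'the', 'to'}  # illustrative subset


def applyFilters_sketch(word):
    token = word.lower().strip(string.punctuation)
    if not token or token in _STOPWORDS:
        return None  # falsy, so createTermIndex skips this token
    return token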
def createLexicon(sortTepDic):
    # The lexicon is the sorted list of all index terms.
    keys = list(sortTepDic.keys())
    Data.write_dataStruct_to_file(Contants.LEXICON_FILE_NAME, keys)
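# Data.write_dataStruct_to_file() and the Contants module are project-local
# and not shown in this section. A plausible pickle-based sketch of the
# helper (an assumption, not the project's actual implementation):
import pickle


def write_dataStruct_to_file_sketch(file_name, data_struct):
    # Serialize any picklable structure (dict, SortedDict, list) to disk.
    with open(file_name, 'wb') as out_file:
        pickle.dump(data_struct, out_file)


# Typical entry point: building the term index also writes the word index,
# lexicon, and posting list files as a side effect.
if __name__ == '__main__':
    createTermIndex()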