Python generate_skip_list 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: index

메소드/함수: generate_skip_list

hotexamples.com에서의 예제들: 7

Python generate_skip_list - 7개의 예제가 발견되었습니다. 이것들은 오픈소스 프로젝트에서 추출된 Python의 index.generate_skip_list에 대한 실세계 최고 등급의 예제들입니다. 예제들을 평가하여 예제의 품질 향상에 도움을 줄 수 있습니다.

예제 #1

파일 보기

파일: search.py 프로젝트: ousys/NaturalLanguage

def intersect_with_skips(p1, p2):
    """
    Intersect two postings lists, following skip pointers where possible
    (algorithm in figure 2.10 of IIR).

    Each posting is read as ``posting[0][0]`` for its doc ID.  A posting of
    length 2 has a skip pointer: ``posting[1]`` is the index, within the same
    list, of the posting the skip leads to.  Skip pointers are assumed to
    point forward in the list.

    Returns [] when either list is empty or no doc ID is shared.  Otherwise
    the shared doc IDs are handed to index.generate_skip_list and each entry
    of its result is wrapped in a one-element list.
    """
    if not p1 or not p2:
        return []

    answer = []
    ptr1 = 0
    ptr2 = 0
    while ptr1 != len(p1) and ptr2 != len(p2):
        doc1 = p1[ptr1][0][0]
        doc2 = p2[ptr2][0][0]
        if doc1 == doc2:
            answer.append(doc1)
            ptr1 += 1
            ptr2 += 1
        elif doc1 < doc2:
            # Follow skip pointers for as long as the skip target does not
            # overshoot doc2.  The target's doc ID is [0][0]; comparing the
            # whole [0] element against a doc ID never matched.
            skipped = False
            while len(p1[ptr1]) == 2 and p1[p1[ptr1][1]][0][0] <= doc2:
                ptr1 = p1[ptr1][1]
                skipped = True
            if not skipped:
                ptr1 += 1
        else:
            # Mirror image of the branch above, advancing through p2.
            skipped = False
            while len(p2[ptr2]) == 2 and p2[p2[ptr2][1]][0][0] <= doc1:
                ptr2 = p2[ptr2][1]
                skipped = True
            if not skipped:
                ptr2 += 1

    if not answer:
        return []
    return [[e] for e in index.generate_skip_list(answer, always_insert_skips)]

예제 #2

파일 보기

파일: search.py 프로젝트: dw6/NUS

def union_with_skips(p1, p2):
    """
    Union two postings lists together.

    Collects ``posting[0]`` (the doc ID) from every posting in p1 and p2,
    removes duplicates, sorts the IDs, and returns whatever
    index.generate_skip_list builds from that sorted list.  Doc IDs must be
    hashable and mutually orderable.
    """
    doc_ids = set(posting[0] for posting in p1)
    doc_ids.update(posting[0] for posting in p2)
    # sorted() yields a real list on both Python 2 and Python 3, whereas
    # dict.keys().sort() only works on Python 2.
    answer = sorted(doc_ids)
    return index.generate_skip_list(answer, always_insert_skips)

예제 #3

파일 보기

파일: search.py 프로젝트: ousys/NaturalLanguage

def union_with_skips(p1, p2):
    """
    Union two postings lists together.

    Collects ``posting[0][0]`` (the doc ID) from every posting in p1 and p2,
    removes duplicates, sorts the IDs, passes them to
    index.generate_skip_list, and wraps each entry of the result in a
    one-element list.  Doc IDs must be hashable and mutually orderable.
    """
    doc_ids = set(posting[0][0] for posting in p1)
    doc_ids.update(posting[0][0] for posting in p2)
    # sorted() yields a real list on both Python 2 and Python 3, whereas
    # dict.keys().sort() only works on Python 2.
    answer = sorted(doc_ids)
    skip_list = index.generate_skip_list(answer, always_insert_skips)
    return [[e] for e in skip_list]

예제 #4

파일 보기

파일: search.py 프로젝트: ousys/NaturalLanguage

def process_NOT(a):
    """
    Return the postings for every doc ID that is NOT in `a`.

    `a` is either a postings list (a ``list`` whose entries expose the doc ID
    as ``entry[0][0]``) or a key of word_dict.  For a key, word_dict[a][1] is
    used as the seek offset into the open file `f` and word_dict[a][2] as the
    number of bytes to read; the text read is parsed with singleline().

    The module-level cache `all_fids` is filled on the first call from the
    first `all_length` bytes of `f`.

    Returns the entries of index.generate_skip_list(...) for the remaining
    doc IDs, each wrapped in a one-element list.  Doc IDs must be hashable.
    """
    # read the postings list for all doc ID's into all_fids when this function is first called
    global all_fids
    if all_fids is None:
        # NOTE(review): looks like leftover debug output; kept so stdout is unchanged.
        print(all_length)
        f.seek(0)
        all_fids = [pair[0][0] for pair in singleline(f.read(all_length))]

    if not isinstance(a, list):
        f.seek(word_dict[a][1])
        postings = singleline(f.read(word_dict[a][2]))
    else:
        postings = a

    # A set gives O(1) membership tests instead of scanning a list for every
    # candidate doc ID.
    excluded = set(pair[0][0] for pair in postings)
    other_fids = [fid for fid in all_fids if fid not in excluded]
    return [[e] for e in index.generate_skip_list(other_fids, always_insert_skips)]

예제 #5

파일 보기

파일: search.py 프로젝트: ousys/NaturalLanguage

def process_NOT(a):
    """
    Return the postings for every doc ID that is NOT in `a`.

    `a` is either a postings list (a ``list`` whose entries expose the doc ID
    as ``entry[0][0]``) or a key of word_dict.  For a key, word_dict[a][1] is
    used as the seek offset into the open file `f` and word_dict[a][2] as the
    number of bytes to read; the text read is parsed with singleline().

    The module-level cache `all_fids` is filled on the first call from the
    first `all_length` bytes of `f`.

    Returns the entries of index.generate_skip_list(...) for the remaining
    doc IDs, each wrapped in a one-element list.  Doc IDs must be hashable.
    """
    # read the postings list for all doc ID's into all_fids when this function is first called
    global all_fids
    if all_fids is None:
        # NOTE(review): looks like leftover debug output; kept so stdout is unchanged.
        print(all_length)
        f.seek(0)
        all_fids = [pair[0][0] for pair in singleline(f.read(all_length))]

    if isinstance(a, list):
        postings = a
    else:
        f.seek(word_dict[a][1])
        postings = singleline(f.read(word_dict[a][2]))

    # Build the exclusion set once so each membership test is O(1).
    excluded = set(pair[0][0] for pair in postings)
    other_fids = [fid for fid in all_fids if fid not in excluded]
    return [[e]
            for e in index.generate_skip_list(other_fids, always_insert_skips)]

예제 #6

파일 보기

파일: search.py 프로젝트: dw6/NUS

def process_NOT(a):
    """
    Return the skip list of every doc ID that is NOT in `a`.

    `a` is either a postings list (a ``list`` whose entries expose the doc ID
    as ``entry[0]``) or a value whose first element ``a[0]`` is a key of
    word_dict.  In the latter case word_dict[a[0]][1] is the start offset and
    word_dict[a[0]][2] the number of bytes to read from postings_file; the
    data read is decoded with compress.uncompress_postings_list().

    The module-level cache `all_fids` is filled on the first call from line 1
    of "all_id.txt".

    Returns index.generate_skip_list(...) applied to the remaining doc IDs.
    Doc IDs must be hashable.
    """
    # read the postings list for all doc ID's into all_fids when this function is first called
    global all_fids
    if all_fids is None:
        # NOTE(review): eval() executes whatever line 1 of all_id.txt contains;
        # only safe while that file is trusted.  Consider ast.literal_eval.
        all_fids = [pair[0] for pair in eval(linecache.getline("all_id.txt", 1))]

    if not isinstance(a, list):
        start_byte = word_dict[a[0]][1]
        num_bytes = word_dict[a[0]][2]

        # The context manager closes the handle; previously it was leaked on
        # every call.
        # NOTE(review): opened in the default (text) mode as before -- confirm
        # whether "rb" is intended for the compressed postings.
        with open(postings_file) as fh:
            fh.seek(start_byte)
            bytestream = fh.read(num_bytes)
        postings = compress.uncompress_postings_list(bytestream)
    else:
        postings = a

    # A set gives O(1) membership tests instead of scanning a list for every
    # candidate doc ID.
    excluded = set(pair[0] for pair in postings)
    other_fids = [fid for fid in all_fids if fid not in excluded]
    return index.generate_skip_list(other_fids, always_insert_skips)

예제 #7

파일 보기

파일: search.py 프로젝트: ousys/NaturalLanguage

def intersect_with_skips(p1, p2):
    """
    Intersect two postings lists, following skip pointers where possible
    (algorithm in figure 2.10 of IIR).

    Each posting is read as ``posting[0][0]`` for its doc ID.  A posting of
    length 2 has a skip pointer: ``posting[1]`` is the index, within the same
    list, of the posting the skip leads to.  Skip pointers are assumed to
    point forward in the list.

    Returns [] when either list is empty or no doc ID is shared.  Otherwise
    the shared doc IDs are handed to index.generate_skip_list and each entry
    of its result is wrapped in a one-element list.
    """
    if not p1 or not p2:
        return []

    answer = []
    ptr1 = 0
    ptr2 = 0
    while ptr1 != len(p1) and ptr2 != len(p2):
        doc1 = p1[ptr1][0][0]
        doc2 = p2[ptr2][0][0]
        if doc1 == doc2:
            answer.append(doc1)
            ptr1 += 1
            ptr2 += 1
        elif doc1 < doc2:
            # Take skips while the skip target's doc ID ([0][0], not the
            # whole [0] element) does not overshoot doc2; otherwise step by
            # one posting.
            took_skip = False
            while len(p1[ptr1]) == 2 and p1[p1[ptr1][1]][0][0] <= doc2:
                ptr1 = p1[ptr1][1]
                took_skip = True
            if not took_skip:
                ptr1 += 1
        else:
            # Mirror image of the branch above, advancing through p2.
            took_skip = False
            while len(p2[ptr2]) == 2 and p2[p2[ptr2][1]][0][0] <= doc1:
                ptr2 = p2[ptr2][1]
                took_skip = True
            if not took_skip:
                ptr2 += 1

    if not answer:
        return []
    return [[e]
            for e in index.generate_skip_list(answer, always_insert_skips)]