Example #1
import os
import sys
import time
import pickle as pkl
from random import randint

# Assumed to be requests' ConnectionError, since the parser fetches pages
# over HTTP via requests.
from requests.exceptions import ConnectionError

# bnext_parser, print_time and _RETRY_LIMIT are provided by the
# surrounding test module.


def _test_get_category_urls(test_file):

    print("\n====================== category urls =========================\n")
    print("".join([
        "Testing get_category_urls(); don't worry if you see some logs on \n",
        "the fly, they are there for the purpose of analyzing the webpage. \n",
        "A test failure will be shown by [assert]\n"
    ]))

    if not os.path.isfile(test_file):
        print("".join([
            "Error: can't find test_file: {}, please check the filename or",
            " generate a new test_file\n"
        ]).format(test_file))
        return False

    # Test cases are pickled, so open the file in binary mode.
    with open(test_file, 'rb') as f:
        obj = pkl.load(f)
    print_time(obj)

    ground_input = obj['ground_input']
    ground_truth = obj['ground_truth']

    for i, url in enumerate(ground_input):
        retry = 0
        while retry < _RETRY_LIMIT:
            try:
                ret = bnext_parser.get_category_urls(url,
                                                     back_counting_offset=3)
                # Only the last 40 category URLs are recorded as ground truth.
                ret = ret[-40:]
                if ret != ground_truth[i]:
                    print('test failed: {}\n'.format(url))
                    return False
                break
            except ConnectionError:
                # Back off for a random interval before retrying.
                retry += 1
                print('({}/{}) retrying...'.format(retry, _RETRY_LIMIT))
                time.sleep(randint(10, 15))
        else:
            # The retry limit was exhausted without a successful fetch.
            print('test failed (connection): {}\n'.format(url))
            return False

        sys.stdout.write('.')
        # time.sleep(1)

    print('\nSuccess')
    return True
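
A minimal sketch of how this test might be driven, assuming the module is run as a script and the fixture lives at the path written by generate_get_category_testcase() in Example #2 (the __main__ driver itself is hypothetical):

if __name__ == '__main__':
    # Hypothetical driver; the path mirrors the one used by
    # generate_get_category_testcase() below.
    testcase = './bnext/resources/testcase/get_category_urls_testcase.pkl'
    ok = _test_get_category_urls(testcase)
    sys.exit(0 if ok else 1)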
Example #2
import pickle as pkl
from datetime import datetime

import requests
from bs4 import BeautifulSoup

# bnext_parser, try_response and _pseudo_request_response_dict are provided
# by the surrounding test module.


def generate_get_category_testcase(ground_input):
    global _pseudo_request_response_dict

    generating_time = datetime.now()
    ground_truth = []

    for url in ground_input:
        ret = bnext_parser.get_category_urls(url, back_counting_offset=3)
        # Only the last 40 category URLs are kept as the expected output.
        ground_truth.append(ret[-40:])

# ========================================================================================
# Getting the responses needed for mocking requests.get()
# ========================================================================================
        res = requests.get(url)
        _pseudo_request_response_dict[url] = res
        prefix = 'http://www.bnext.com.tw'
        soup = BeautifulSoup(res.content, 'html.parser')
        page_list = soup.find('ul', 'pagination')
        # The last pagination link points at the final page of the category.
        last_page = page_list.find_all('a')[-1]['href']
        midfix = '?p='
        last_page = int(last_page.split('=')[-1]) + 1
        starting_page = last_page - 3

        # Also record the responses for the last three pages.
        for page in range(starting_page, last_page):
            res = try_response(url + midfix + str(page))
            _pseudo_request_response_dict[url + midfix + str(page)] = res

# ========================================================================================
# Dumping testcases to file
# ========================================================================================

    obj = {'ground_input': ground_input, 'ground_truth': ground_truth,
           'generating_time': generating_time}

    testcase_path = './bnext/resources/testcase/get_category_urls_testcase.pkl'

    # Pickled objects must be written in binary mode.
    with open(testcase_path, 'wb') as f:
        pkl.dump(obj, f)

    return ground_truth
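
The responses collected in _pseudo_request_response_dict are meant for replaying requests.get() offline, as the comment above notes. A minimal sketch of that mocking step, assuming the dictionary has already been populated; pseudo_requests_get and run_offline_test are hypothetical names:

from unittest import mock


def pseudo_requests_get(url, *args, **kwargs):
    # Serve the previously recorded response instead of hitting the network.
    return _pseudo_request_response_dict[url]


def run_offline_test(test_file):
    # Patch requests.get so get_category_urls() reads the recorded responses.
    with mock.patch('requests.get', side_effect=pseudo_requests_get):
        return _test_get_category_urls(test_file)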