Ejemplo n.º 1
0
def _perform_check_and_write_to_results_file(case_pattern, row, row_holder):

    print "Start:", row.index, row.CIK, case_pattern.pattern, row.case_name

    # check if CIK is valid.
    if Utilities.is_CIK_valid(row.CIK):
        for year in xrange(2004, 2012 + 1):

            raw_data = _get_raw_data(row.CIK, year)

            if raw_data is not None:
                if re.search(case_pattern, raw_data):
                    row.case_mentioned_in_a_10k_for_a_year(year)

    row_holder.append(row.construct_row_with_ordered_fields())
Ejemplo n.º 2
0
def _read_ouput_file_and_get_finished_indices():
    '''
        Read the output file and return the set of indices that exist in
        there -- those are the finished rows.

        Side effect: also populates the already-learned plaintiff -> CIK
        mapping (only for rows whose CIK is valid), mirroring the caching
        done in main().
    '''
    results = set()

    # Use a context manager so the file handle is always closed
    # (the original left it open for the life of the process).
    with open(Constants.PATH_TO_NEW_LITIGATION_FILE, 'rb') as output_file:
        reader = csv.reader(output_file, delimiter=',')

        for row in reader:
            # Blank lines yield empty lists; malformed rows may be short.
            # Skip anything without the four columns we need.
            if len(row) < 4:
                continue

            index = row[0]
            CIK = row[2]
            plaintiff = row[3]

            results.add(index)
            if Utilities.is_CIK_valid(CIK):
                _name_to_cik_mapping[plaintiff] = CIK

    return results
Ejemplo n.º 3
0
def main(items_to_add):
    """Process up to `items_to_add` unfinished litigation rows.

    For each row not already in the output file (and not explicitly
    skipped), resolve a CIK if possible, then fan the 10-K pattern check
    out to a worker pool; finally append all produced rows to the output
    CSV.
    """
    finished_indices = _read_ouput_file_and_get_finished_indices()

    pool = multiprocessing.Pool(maxtasksperchild=15)

    # Shared list so worker processes can hand results back.
    row_holder = _manager.list()

    processed_index_counter = 0

    litigation_reader = csv.reader(open(Constants.PATH_TO_LITIGATION_FILE, 'rb'), delimiter=',')

    for row in litigation_reader:

        row_object = NewRowGenerator(*row)

        # already processed.
        if row_object.index in finished_indices:
            continue

        # intentionally skip.
        if row_object.CIK == Constants.CIK_CODE_TO_INDICATE_ROW_SHOULD_BE_SKIPPED:
            continue

        processed_index_counter += 1

        if processed_index_counter > items_to_add:
            break

        # rows always have a plaintiff but not always a CIK.
        #
        # BUG FIX: the original inverted this test -- it cached the
        # mapping when the CIK was INVALID and tried to look one up when
        # the CIK was already valid, contradicting both its own comments
        # and the caching done in _read_ouput_file_and_get_finished_indices().
        if Utilities.is_CIK_valid(row_object.CIK):
            # This row has a valid CIK-company name mapping: cache it.
            # Update the key-value pairing with each row iteration,
            # as company CIKs can change as time goes on.
            if len(row_object.plaintiff) > 0:
                _name_to_cik_mapping[row_object.plaintiff] = row_object.CIK

        else:
            # This row didn't have a valid CIK. Check previous rows for
            # the mapping we want; _get_potential_cik_from_company_name
            # falls back to the company name / EDGAR lookup.
            result = _get_potential_cik_from_company_name(row_object.plaintiff)
            if result is not None:
                row_object.CIK = result

        if not Utilities.is_CIK_valid(row_object.CIK):
            # Deliberately NOT skipping: the worker still records the row.
            print "Error: No CIK. Index:", row_object.index

        case_pattern = _get_first_word_of_case_name(row_object.case_name)

        pool.apply_async(_perform_check_and_write_to_results_file, \
            args=(case_pattern, row_object, row_holder))

    pool.close()
    pool.join()

    # Append results; context manager guarantees the handle is flushed
    # and closed (the original never closed the writer's file).
    with open(Constants.PATH_TO_NEW_LITIGATION_FILE, 'ab') as output_file:
        litigation_writer = csv.writer(output_file, delimiter=',')
        for row in row_holder:
            litigation_writer.writerow(row)