Exemplo n.º 1
0
def insert_race(soup):
    """Register twelve ``Race`` rows for every race day listed on a page.

    The year and month are read from the ``h3.midashi3rd`` heading. Every
    ``tbody tr`` row that has more than two cells and a link in its first
    cell is treated as one race day; rounds 1 through 12 of that day are
    passed to ``Race.objects.get_or_create``.

    Args:
        soup: Parsed HTML document exposing ``find`` and ``select``
            (presumably a BeautifulSoup object -- confirm against caller).

    Returns:
        None.
    """
    # Extract year and month field
    year_month = soup.find("h3", {"class": "midashi3rd"}).string
    year = formatter(r"(\d+)年\d+月", year_month, "int")
    month = formatter(r"\d+年(\d+)月", year_month, "int")

    for row in soup.select("tbody tr"):
        cells = row.find_all("td")

        # Skip rows that do not describe a race day.
        if len(cells) <= 2 or cells[0].find("a") is None:
            continue

        # The digits taken from the first cell's link are prefixed with "20";
        # the slices below then pick fixed positions out of that string.
        race_id_without_round = "20" + formatter(r"\d+", get_from_a(cells[0]))
        day = formatter(r"(\d+)日([日月火水木金土])", str(cells[0]), "int")
        place_id = race_id_without_round[4:6]
        place_name = to_place_name(place_id)
        days = int(race_id_without_round[6:8])
        times = int(race_id_without_round[8:10])

        # The date is the same for all twelve rounds, so build it once.
        race_dt = date(year, month, day)

        # NOTE(review): every field is used as a lookup key here; if race_id
        # alone identifies a race, ``defaults=`` may be the safer form --
        # confirm against the Race model before changing.
        for r in range(1, 13):
            Race.objects.get_or_create(
                race_id=race_id_without_round + str(r).zfill(2),
                race_dt=race_dt,
                place_id=place_id,
                place_name=place_name,
                days=days,
                times=times,
                round=r,
            )
Exemplo n.º 2
0
def update_race_result(soup, race):
    """Fill in a race's details from its result page and save it.

    Sets ``title``, ``grade``, ``type``, ``length``, ``weather`` and
    ``condition`` from the page, sets ``head_count`` and ``max_prize`` from
    ``agg_results(race)``, marks ``result_flg`` as True and calls
    ``race.save()``.

    Args:
        soup: Parsed HTML document exposing ``find`` (presumably a
            BeautifulSoup object -- confirm against caller).
        race: Object whose attributes are updated and which is then saved.

    Returns:
        None.
    """
    race.title = soup.find("title").string.split(u"|")[0]

    # Both the grade and the detail line live under the same <dl> element,
    # so look it up once.
    racedata = soup.find("dl", {"class": "racedata"})
    race.grade = formatter(r"\((G\d)\)", str(racedata.find("h1")))

    # RACE DETAILS
    # The <span> text is split on " / " where the spaces are no-break spaces.
    line = racedata.find("span").string.split(u"\xa0/\xa0")
    race.type = to_course_full(formatter("[芝ダ障]", line[0]))
    race.length = formatter(r"\d{4}", line[0], "int")
    race.weather = formatter("晴|曇|小雨|雨|小雪|雪", line[1])
    race.condition = formatter("良|稍重|重|不良", line[2])

    # RACE SUMMARY INFORMATION
    race.head_count, race.max_prize = agg_results(race)

    race.result_flg = True
    race.save()
Exemplo n.º 3
0
def parse_entry_8(cells, race):
    """Build a ``Result`` from an entry-table row, without odds data.

    Reads the horse from ``cells[1]``, sex and age from ``cells[2]``, burden
    from ``cells[3]``, jockey from ``cells[4]`` and trainer from
    ``cells[5]``. ``odds`` and ``odor`` are set to 0. The result is not saved
    here.

    Args:
        cells: Indexable sequence of table cells for one row (presumably the
            8-column entry layout -- confirm against caller).
        race: Race the entry belongs to; its ``race_id`` is prefixed to the
            horse id to form ``result.key``.

    Returns:
        The populated ``Result`` instance.
    """
    result = Result()

    result.race = race
    result.horse_id = formatter(r"\d+", get_from_a(cells[1]))
    # The name pattern matches a run of characters that are neither in the
    # ASCII range '!'-'~' nor a no-break space.
    result.horse_name = formatter("[^!-~\xa0]+", get_from_a(cells[1], "name"))
    result.key = race.race_id + result.horse_id
    result.sex = formatter("[牡牝騸セ]", cells[2].string)
    result.age = formatter(r"\d+", cells[2].string, "int")
    result.burden = formatter(r"(\d+).?\d?", cells[3].string, "float")
    result.jockey_id = formatter(r"\d+", get_from_a(cells[4]))
    result.jockey_name = formatter("[^!-~\xa0]+", get_from_a(cells[4], "name"))
    result.trainer_id = formatter(r"\d+", get_from_a(cells[5]))
    result.trainer_name = formatter("[^!-~\xa0]+",
                                    get_from_a(cells[5], "name"))
    # This layout provides no odds columns, so both are set to 0.
    result.odds = 0
    result.odor = 0

    return result
Exemplo n.º 4
0
def update_race_entry(soup, race):
    """Fill in a race's details from its entry page and save it.

    Sets ``title``, ``type``, ``length``, ``weather``, ``condition``,
    ``head_count`` and ``max_prize`` from the page, then calls
    ``race.save()``.

    Args:
        soup: Parsed HTML document exposing ``find`` (presumably a
            BeautifulSoup object -- confirm against caller).
        race: Object whose attributes are updated and which is then saved.

    Returns:
        None.
    """
    # Parse HTML
    racedata = soup.find("dl", {"class": "racedata"}).find("dd")
    paragraphs = racedata.find_all("p")
    course = paragraphs[0].string
    # The second paragraph is split on " / " where the spaces are no-break
    # spaces.
    conditions = paragraphs[1].string.split(u"\xa0/\xa0")
    otherdata = soup.find("div", {"class": "race_otherdata"}).find_all("p")

    # The title pattern matches a run of characters that are neither in the
    # ASCII range '!'-'~' nor a no-break space.
    race.title = formatter("[^!-~\xa0]+", str(racedata.find("h1")))
    race.type = to_course_full(formatter("[芝ダ障]", course))
    race.length = formatter(r"\d{4}", course, "int")
    race.weather = formatter("晴|曇|小雨|雨|小雪|雪", conditions[1])
    race.condition = formatter("良|稍重|重|不良", conditions[2])
    race.head_count = formatter(r"\d+", otherdata[1].string, "int")
    race.max_prize = formatter(r"\d+", otherdata[2].string, "int")

    race.save()
Exemplo n.º 5
0
def parse_entry_12(cells, race):
    """Build a ``Result`` from an entry-table row that includes odds data.

    Reads bracket and horse number from ``cells[0]`` and ``cells[1]``, the
    horse from ``cells[3]``, sex and age from ``cells[4]``, burden from
    ``cells[5]``, jockey from ``cells[6]``, trainer from ``cells[7]``, odds
    from ``cells[8]`` and ``odor`` from ``cells[9]``. The result is not saved
    here.

    Args:
        cells: Indexable sequence of table cells for one row (presumably the
            12-column entry layout -- confirm against caller).
        race: Race the entry belongs to; its ``race_id`` is prefixed to the
            horse id to form ``result.key``.

    Returns:
        The populated ``Result`` instance.
    """
    result = Result()

    result.race = race
    result.bracket = formatter(r"\d+", cells[0].string, "int")
    result.horse_num = formatter(r"\d+", cells[1].string, "int")
    result.horse_id = formatter(r"\d+", get_from_a(cells[3]))
    # The name pattern matches a run of characters that are neither in the
    # ASCII range '!'-'~' nor a no-break space.
    result.horse_name = formatter("[^!-~\xa0]+", get_from_a(cells[3], "name"))
    result.key = race.race_id + result.horse_id
    result.sex = formatter("[牡牝騸セ]", cells[4].string)
    result.age = formatter(r"\d+", cells[4].string, "int")
    result.burden = formatter(r"(\d+).?\d?", cells[5].string, "float")
    result.jockey_id = formatter(r"\d+", get_from_a(cells[6]))
    result.jockey_name = formatter("[^!-~\xa0]+", get_from_a(cells[6], "name"))
    result.trainer_id = formatter(r"\d+", get_from_a(cells[7]))
    result.trainer_name = formatter("[^!-~\xa0]+",
                                    get_from_a(cells[7], "name"))
    result.odds = formatter(r"\d+.\d+", cells[8].string, "float")
    result.odor = formatter(r"\d+", cells[9].string, "int")

    return result
Exemplo n.º 6
0
def parse_result(cells, race, tof):
    """Build a ``Result`` from one row of a race-result table.

    Reads rank, bracket, horse number, horse, sex/age, burden, jockey,
    finish time, last-3F time, odds, ``odor``, weight and weight difference,
    trainer, owner and prize from fixed cell positions. The result is not
    saved here.

    Args:
        cells: Indexable sequence of table cells for one row; indices up to
            20 are read.
        race: Race the result belongs to; its ``race_id`` is prefixed to the
            horse id to form ``result.key``.
        tof: Reference time in seconds subtracted from the finish time to
            obtain ``time_lag`` (presumably the winner's time -- confirm
            against caller). A value of 0 forces ``time_lag`` to 0.

    Returns:
        The populated ``Result`` instance.
    """
    result = Result()

    result.race = race
    result.rank = formatter(r"\d+", cells[0].string, "int")
    result.bracket = formatter(r"\d+", cells[1].string, "int")
    result.horse_num = formatter(r"\d+", cells[2].string, "int")
    result.horse_id = formatter(r"\d+", get_from_a(cells[3]))
    # The name pattern matches a run of characters that are neither in the
    # ASCII range '!'-'~' nor a no-break space.
    result.horse_name = formatter("[^!-~\xa0]+", get_from_a(cells[3], "name"))
    result.key = race.race_id + result.horse_id
    result.sex = formatter("[牡牝騸セ]", cells[4].string)
    result.age = formatter(r"\d+", cells[4].string, "int")
    result.burden = formatter(r"(\d+).?\d?", cells[5].string, "float")
    result.jockey_id = formatter(r"\d+", get_from_a(cells[6]))
    result.jockey_name = formatter("[^!-~\xa0]+", get_from_a(cells[6], "name"))

    # The finish-time text is split on ':' and '.', and the three pieces are
    # combined as minutes * 60 + seconds + tenths / 10. When the cell has no
    # string, finish_time is left at whatever Result() initialised it to.
    if cells[7].string is not None:
        parts = [int(piece) for piece in re.split(r"[:.]", cells[7].string)]
        result.finish_time = (parts[0] * 60 + parts[1]) + (parts[2] / 10)

    if result.finish_time is not None and tof != 0:
        result.time_lag = round(result.finish_time - tof, 2)
    else:
        result.time_lag = 0

    result.last3f_time = formatter(r"\d+.\d+", cells[11].string, "float")
    result.odds = formatter(r"\d+.\d+", cells[12].string, "float")
    result.odor = formatter(r"\d+", cells[13].string, "int")
    # Cell 14 holds text shaped like "<weight>(<signed diff>)".
    result.weight = formatter(r"(\d+)\([+-]?\d*\)", cells[14].string, "int")
    result.weight_diff = formatter(r"\d+\(([+-]?\d+)\)", cells[14].string,
                                   "int")
    result.trainer_id = formatter(r"\d+", get_from_a(cells[15]))
    result.trainer_name = formatter("[^!-~\xa0]+",
                                    get_from_a(cells[15], "name"))
    result.owner_id = formatter(r"\d+", get_from_a(cells[19]))
    result.owner_name = formatter("[^!-~\xa0]+", get_from_a(cells[19], "name"))
    result.prize = formatter(r"\d*,?\d*.?\d+", cells[20].string, "float")

    return result