Пример #1
0
def build_season():
    """Create one Season document per (team, season) pair and attach its games.

    Does nothing (other than printing a notice) when at least one Season
    document already exists. Otherwise, for every team and every distinct
    ``season`` value found on Game documents, a Season document is saved and
    each game in which the team is either ``home`` or ``away`` is pushed onto
    its ``games`` field. A warning is printed for any pair with fewer than
    16 games.
    """
    existing_seasons = Season.objects.count()
    if existing_seasons:
        print('Already loaded seasons')
        return

    distinct_seasons = Game.objects.distinct('season')
    for club in Team.objects():
        print("Parsing " + club.name)
        for season_value in distinct_seasons:
            # Games of this season in which the team played on either side.
            involves_club = Q(home=club) | Q(away=club)
            club_games = Game.objects(involves_club).filter(season=season_value)

            record = Season(team=club, season=season_value)
            record.save()
            # The document is saved first, then games are appended one at a
            # time through individual push updates.
            for match in club_games:
                record.update(push__games=match)

            if club_games.count() >= 16:
                continue
            print('Season has less than 16 games')
            print(repr(season_value))
Пример #2
0
def build_plays():
    """Normalise every stored Play document in place.

    Returns early (after printing a message) when there are no Play or no
    Team documents. Otherwise each play is processed as follows:

    * plays with an empty ``gameid`` are printed and deleted;
    * ``min``, ``sec``, ``down``, ``togo``, ``yardline``, ``defscore`` and
      ``offscore`` are cast to ``int``, falling back to a per-field default
      when the value is missing or cannot be converted;
    * ``date``, ``home`` and ``away`` are derived from ``gameid``, which is
      parsed as ``YYYYMMDD_<away>@<home>``;
    * ``possession`` is the Team named by ``offense`` (``None`` if unset);
    * ``season`` is cast to ``int``, defaulting to a value derived from the
      game date;
    * the play is saved.

    Progress is printed every 1000 plays and once more at the end.

    Raises:
        KeyError: a team name in ``gameid`` or ``offense`` does not match
            the ``name`` of any Team document.
        IndexError: ``gameid`` lacks the ``_`` or ``@`` separator.
        ValueError: the date part of ``gameid`` is not a valid date.
    """
    if not Play.objects.count():
        print('No plays in database')
        return
    if not Team.objects.count():
        print('No teams in database')
        return

    # Cache teams by name for dictionary lookups while parsing plays.
    teams = {team.name: team for team in Team.objects()}

    def parse_team(team_name):
        """Return the cached Team whose name is ``team_name``."""
        return teams[team_name]

    def parse_game_id(game_id):
        """Split ``YYYYMMDD_<away>@<home>`` into ``(date, home, away)``."""
        game_string = game_id.split('_', 1)
        date_part = game_string[0]
        teams_in_game = game_string[1].split('@')
        d = date(
            year=int(date_part[:4]),
            month=int(date_part[4:6]),
            day=int(date_part[6:8])
        )
        # The away team is listed before the '@', the home team after it.
        away = parse_team(teams_in_game[0])
        home = parse_team(teams_in_game[1])
        return d, home, away

    def parse_description(desc):
        """Placeholder; currently does nothing and is not called."""
        # TODO: add metadata to plays

    def parse_season(date_of_match):
        """Return the season year for a game date.

        Dates in January through March are attributed to the previous year.
        """
        offset = 0
        if date_of_match.month < 4:
            offset = -1
        return date_of_match.year + offset

    def cast_int(play, value, default):
        """Return ``int(value)``, or ``default`` if missing or unconvertible.

        ``play`` is only used for the diagnostic printout on failure.
        """
        # Raw values listed by the original author: None, '', '.B'
        if value is None or value == '':
            return default
        try:
            return int(value)
        except (TypeError, ValueError, OverflowError):
            # Only conversion failures are swallowed, so KeyboardInterrupt
            # and SystemExit can still stop this long-running loop.
            print('Exception casting ' + str(value) + ' as integer')
            print(repr(play))
            return default

    counter = 0
    for play in Play.objects:
        if counter % 1000 == 0:
            print('Parsed ' + str(counter) + ' plays')
        counter += 1
        if not play.gameid:
            # Without a gameid the date and teams cannot be derived.
            print('Deleting empty document ' + str(play.id))
            print(repr(play))
            play.delete()
            continue
        play.min = cast_int(play, play.min, 60)
        play.sec = cast_int(play, play.sec, 0)
        play.down = cast_int(play, play.down, None)
        play.togo = cast_int(play, play.togo, None)
        play.yardline = cast_int(play, play.yardline, None)
        play.defscore = cast_int(play, play.defscore, 0)
        play.offscore = cast_int(play, play.offscore, 0)
        play.date, play.home, play.away = parse_game_id(play.gameid)
        play.possession = parse_team(play.offense) if play.offense else None
        # play.date must be set before this line: it feeds the season default.
        play.season = cast_int(play, play.season, parse_season(play.date))
        play.save()

    print('Parsed ' + str(counter) + ' plays')