Примеры использования getDataType в Python

Язык программирования: Python

Пространство имен/Пакет: genBSandURLtools

Метод/Функция: getDataType

Примеров на hotexamples.com: 4

Python getDataType — найдено 4 примера. Это лучшие примеры кода на Python для genBSandURLtools.getDataType, взятые из проектов с открытым исходным кодом. Вы можете оценить каждый пример, чтобы помочь нам улучшить качество примеров.

Пример #1

Показать файл

def getESPNbox(data_in, mode='url'):
    '''
    Parse an ESPN box score into header rows, player rows and player links.

    data_in is a box score url obtained from the score-summary ESPN page;
    it is handed, together with mode, straight to
    genBSandURLtools.getDataType, which returns the 'table' HTML
    structures (parsed with BeautifulSoup).  The first table whose text
    contains 'STARTERS' is treated as the box score.

    Returns a dict with three keys:
        'details'     -- for every table row, the text of its 'th' cells
                         (headers, teams stuff)
        'content'     -- for every table row, the text of its 'td' cells
                         (actual player data)
        'playerlinks' -- whatever getESPNplayerlinks returns for the rows

    Raises AttributeError when no table contains 'STARTERS'.
    '''
    tables = genBSandURLtools.getDataType(data_in, 'table', mode)
    summary = [t for t in tables if 'STARTERS' in t.text]
    if not summary:
        # Call-form raise: valid on Python 2 and Python 3 alike (the
        # "raise Exc, msg" statement form is a SyntaxError on Python 3).
        raise AttributeError("Houston, there is a f*****g problem")
    rows = summary[0].findAll('tr')
    details = []
    content = []
    for row in rows:
        # Both lists get one entry per row, so they stay index-aligned;
        # a row without 'th' (or 'td') cells contributes an empty list.
        details.append([str(cell.text) for cell in row.findAll('th')])
        content.append([str(cell.text) for cell in row.findAll('td')])
    playerlink_dict = getESPNplayerlinks(rows)
    return {
        'details': details,
        'content': content,
        'playerlinks': playerlink_dict,
    }

Пример #2

Показать файл

Файл: parseESPN.py Проект: abresler/NBA-Data-Stuff

def getESPNpbp(data_in, mode='url'):
    '''
    Parse an ESPN play-by-play page into a header row and play rows.

    data_in is a play-by-play url obtained from the score-summary ESPN
    page; it is handed, together with mode, straight to
    genBSandURLtools.getDataType, which returns the 'table' HTML
    structures (parsed with BeautifulSoup).  The first table whose text
    contains 'TIME' is treated as the play-by-play table.

    Returns a dict with two keys:
        'head'    -- text of the 'th' cells of the table's second row
                     (time, away, score, home)
        'content' -- for every row from the third one on, the text of
                     its 'td' cells

    Raises AttributeError when no table contains 'TIME'.  The second row
    is indexed unconditionally, so a table with fewer than two rows is
    expected to fail with IndexError.
    '''
    tables = genBSandURLtools.getDataType(data_in, 'table', mode)
    pbp = [t for t in tables if 'TIME' in t.text]
    if not pbp:
        # Call-form raise: valid on Python 2 and Python 3 alike (the
        # "raise Exc, msg" statement form is a SyntaxError on Python 3).
        raise AttributeError("Houston, there is a f*****g problem")
    rows = pbp[0].findAll('tr')
    # Use BS to get the headers (e.g., home and away team for game).
    header = [str(h.text) for h in rows[1].findAll('th')]  # time, away, score, home
    # Everything after the header row is play data.
    content = [[str(e.text) for e in row.findAll('td')] for row in rows[2:]]
    return {'head': header, 'content': content}

Пример #3

Показать файл

def getESPNpbp(data_in, mode='url'):
    '''
    Extract the play-by-play table from an ESPN page.

    data_in is a play-by-play url obtained from the score-summary ESPN
    page.  It is forwarded with mode to genBSandURLtools.getDataType to
    obtain the page's 'table' HTML structures (BeautifulSoup objects);
    the first one whose text contains 'TIME' is used.

    Returns {'head': [...], 'content': [[...], ...]} where 'head' holds
    the 'th' cell texts of the second table row (time, away, score, home)
    and 'content' holds, per remaining row, the texts of its 'td' cells.

    Raises AttributeError if no table contains 'TIME'.  A matching table
    with fewer than two rows is expected to raise IndexError, because the
    header row is read by position.
    '''
    tables = genBSandURLtools.getDataType(data_in, 'table', mode)
    matching = [table for table in tables if 'TIME' in table.text]
    if not matching:
        # Parenthesised raise works on both Python 2 and Python 3; the
        # comma form is rejected by the Python 3 parser.
        raise AttributeError("Houston, there is a f*****g problem")
    pbp = matching[0].findAll('tr')
    # Use BS to get the headers (e.g., home and away team for game).
    header = [str(h.text)
              for h in pbp[1].findAll('th')]  # time, away, score, home
    content = []
    for line in pbp[2:]:
        cells = line.findAll('td')
        content.append([str(e.text) for e in cells])
    return {'head': header, 'content': content}

Пример #4

Показать файл

Файл: parseESPN.py Проект: abresler/NBA-Data-Stuff

def getESPNbox(data_in, mode='url'):
    '''
    Extract the box score table from an ESPN page.

    data_in is a box score url obtained from the score-summary ESPN page.
    It is forwarded with mode to genBSandURLtools.getDataType to obtain
    the page's 'table' HTML structures (BeautifulSoup objects); the first
    one whose text contains 'STARTERS' is used.

    Returns a dict:
        'details'     -- per table row, the texts of its 'th' cells
                         (headers, teams stuff)
        'content'     -- per table row, the texts of its 'td' cells
                         (actual player data)
        'playerlinks' -- the value returned by getESPNplayerlinks for
                         the table rows

    Raises AttributeError if no table contains 'STARTERS'.
    '''
    tables = genBSandURLtools.getDataType(data_in, 'table', mode)
    matching = [table for table in tables if 'STARTERS' in table.text]
    if not matching:
        # Parenthesised raise works on both Python 2 and Python 3; the
        # comma form is rejected by the Python 3 parser.
        raise AttributeError("Houston, there is a f*****g problem")
    summary = matching[0].findAll('tr')
    details = []
    content = []
    for line in summary:
        # "details" are headers, teams stuff;
        # "content" is actual player data
        details.append([str(h.text) for h in line.findAll('th')])
        content.append([str(h.text) for h in line.findAll('td')])
    playerlink_dict = getESPNplayerlinks(summary)
    return {'details': details, 'content': content,
            'playerlinks': playerlink_dict}