示例#1
0
def processpage(url,i,subber,nextepi,resolution,animename):
	"""Download a listing page, convert it to JSON and extract its rows.

	Prints a timestamped progress banner for ``animename`` / ``nextepi``,
	fetches ``url`` through ``pros.obtainjson``, converts the response text
	with ``html_to_json.convert`` and returns whatever ``getrows`` produces
	for the given subber, episode and resolution. The parameter ``i`` is
	accepted but not used in this function.
	"""
	stamp = datetime.now().strftime("%H:%M:%S")
	print(f'[{stamp}] Processing - {animename} Episode {nextepi}\n=====================')
	page_text = pros.obtainjson(url).text
	page_json = html_to_json.convert(page_text)
	# The site root is handed to getrows as the download prefix.
	return getrows(page_json, subber, nextepi, resolution, 'https://nyaa.si')
示例#2
0
def kona_show(link):
    """Scrape the metadata of a single Konachan post page.

    Args:
        link: Post reference; ``filter_post`` turns it into the post id that
            is used to build the ``/post/show/<id>`` URL.

    Returns:
        dict with the keys ``id``, ``tags`` (space-separated string),
        ``tag_split`` (``tags`` split on single spaces), ``file_ext`` and
        ``file_url``. ``parent_id`` (list of anchor texts) is added only when
        the anchors are found at the expected position in the page.

    Raises:
        KeyError, IndexError: if the converted page does not contain the
            tag ``<meta>`` at the hard-coded path, or if neither an
            "original-file-unchanged" nor an "original-file-changed" element
            exists.
    """
    post_id = filter_post(link)
    base = requests.get(f"https://konachan.com/post/show/{post_id}")
    soup = soupBeauty(base)
    json_ = html_to_json.convert(base.text)

    # The tag string is read from a <meta content=...> at a fixed position in
    # the converted tree; this path is tied to the current page layout.
    tags = json_["html"][0]["head"][0]["link"][2]["meta"][0]["meta"][0]["meta"][3]["_attributes"]["content"]
    infodic = {
        "id": post_id,
        "tags": tags,
        "tag_split": tags.split(" "),
    }

    try:
        prbl = json_["html"][0]["body"][0]["div"][6]["div"][0]["div"][2]["a"]
        # The first anchor is skipped; the remaining anchor texts are kept.
        infodic["parent_id"] = [pr["_value"] for pr in prbl[1:]]
    except (KeyError, IndexError):
        # Best effort: pages without these anchors simply get no "parent_id".
        pass

    try:
        url = soup.find_all(attrs={"class": "original-file-unchanged"})[0].get("href")
    except IndexError:
        # No "unchanged" element on the page: fall back to the "changed" one.
        # Only the empty-result case is handled so unrelated errors surface.
        url = soup.find_all(attrs={"class": "original-file-changed"})[0].get("href")

    # NOTE(review): assumes a three-character extension (jpg/png/gif) - confirm.
    infodic["file_ext"] = url[-3:]
    infodic["file_url"] = url
    return infodic
def test_capturing_neither_attributes_nor_values():
    """With both capture flags off, only the bare element structure remains."""
    markup = "<p id='foo'>bingo</p>test  <br/>   <br/>\ning<br/>"
    converted = html_to_json.convert(
        markup,
        capture_element_values=False,
        capture_element_attributes=False,
    )
    expected = {'p': [{}], 'br': [{}, {}, {}]}
    assert converted == expected
示例#4
0
def _fetch_clean_data(driver, raw_data, listings_clean):
    """Extract attribute text and asking price from each listing in the HTML.

    ``raw_data`` is converted with ``html_to_json.convert`` and every listing
    except the last child of the listings container is walked. For each one a
    dict ``{'attributes': ..., 'ask_price': ...}`` is appended to
    ``listings_clean`` (mutated in place). ``driver`` is accepted but not
    used in this function.

    Returns:
        tuple ``(listings_clean, err)`` where ``err`` lists the attribute
        nodes that had neither a ``span`` nor a ``_value`` entry.
    """
    tree = html_to_json.convert(raw_data)
    unparsed = []

    for entry in tree['div'][0]['div'][0]['div'][:-1]:
        details = entry['div'][0]['div'][0]['div'][0]['div'][0]['div'][0][
            'div'][0]['div'][2]['div']
        attribute_nodes = details[0]['div']
        price = details[1]['div'][0]['div'][0]['span'][1]['_value']

        pieces = []
        for node in attribute_nodes:
            cell = node['div'][0]
            if 'span' in cell:
                pieces.append(cell['span'][0]['_value'])
            elif '_value' in cell:  # sockets
                digits = re.findall(r'\d+', cell['_value'])
                if digits:
                    pieces.append('Sockets:' + digits[0])
            else:
                unparsed.append(node)

        # Every piece is prefixed (not separated) by the ' /// ' marker.
        listings_clean.append({
            'attributes': ''.join(' /// ' + piece for piece in pieces),
            'ask_price': price,
        })

    return listings_clean, unparsed
def test_not_capturing_element_attributes():
    """Attributes are dropped while element and loose text values are kept."""
    markup = "<p id='foo'>bingo</p>test  <br/>   <br/>\ning<br/>"
    converted = html_to_json.convert(markup, capture_element_attributes=False)
    expected = {
        'p': [{'_value': 'bingo'}],
        'br': [{}, {}, {}],
        '_values': ['test', 'ing'],
    }
    assert converted == expected
def test_empty_spaces():
    """Whitespace-only text between elements must not show up as a value."""
    markup = "<p>bingo</p>test  <br/>   <br/>\ning<br/>"
    converted = html_to_json.convert(markup)
    expected = {
        'p': [{'_value': 'bingo'}],
        'br': [{}, {}, {}],
        '_values': ['test', 'ing'],
    }
    assert converted == expected
def test_multiple_text_entries():
    """Several loose text nodes are collected, in order, under ``_values``."""
    markup = "<p>bingo</p>test<br/>\ning<br/>"
    converted = html_to_json.convert(markup)
    expected = {
        'p': [{'_value': 'bingo'}],
        'br': [{}, {}],
        '_values': ['test', 'ing'],
    }
    assert converted == expected
示例#8
0
    def run(self):
        """Convert the HTML playbook input to JSON and publish the result.

        Reads the HTML string from the playbook, converts it with
        ``html_to_json.convert_tables`` when the ``convert_tables`` argument
        is truthy and with ``html_to_json.convert`` otherwise, writes the
        result to the ``htmlToJson.json`` output and sets the exit message.
        """
        source_html = self.tcex.playbook.read(self.args.html_string)
        use_table_mode = self.args.convert_tables

        converter = (html_to_json.convert_tables
                     if use_table_mode else html_to_json.convert)
        converted = converter(source_html)

        # NOTE(review): the converter result is passed as-is with type
        # 'String' - confirm the playbook layer serializes it as intended.
        self.tcex.playbook.create_output('htmlToJson.json', converted,
                                         'String')
        self.exit_message = 'HTML converted to JSON!'
示例#9
0
from urllib import request

import pandas as pd
import requests
import json
import html_to_json

# Debug alternative: fetch the landing page with urllib instead of posting.
#resp = request.urlopen("https://modelo-prueba.herokuapp.com/")
URL = "https://modelo-prueba.herokuapp.com/result"
DATA = {'a':1, 'b':3, 'c':9}

#r = requests.post(url=URL, data=PARAMS)

# POST the form fields; fail fast on an HTTP error status so an error page is
# not fed into the hard-coded lookup below (which would otherwise die with an
# unrelated KeyError/IndexError).
r = requests.post(URL,data=DATA)
r.raise_for_status()
r_json = html_to_json.convert(r.content)

# The value printed is the text of the first <h3> inside the response <body>.
prob = r_json['html'][0]['body'][0]['h3'][0]['_value']

print(prob)
# Debug output for the urllib variant above.
#print(resp.code)
#print(resp.length)
#print(resp.peek())
def test_pdfexaminer():
    """The converted pdfexaminer report must still contain both findings."""
    page = _read_file('./data/pdfexaminer.com.html')
    rendered = str(html_to_json.convert(page))
    expected_findings = (
        '33.0@4675: pdf.exploit Corrupted JPEG2000',
        '1.0@25957: suspicious.obfuscation using app.setTimeOut to eval code',
    )
    for finding in expected_findings:
        assert finding in rendered
def test_missing_content():
    """Both the defanged URL and the date must survive the conversion."""
    page = _read_file('./data/test3_missing_content.html')
    converted = html_to_json.convert(page)
    print(f'json_output {converted}')
    rendered = str(converted)
    assert 'hxxp://ioa993u.space/vnc.exe' in rendered
    assert '2018-08-22' in rendered
def test_simple_html2():
    """A nested navbar list converts to the matching nested dict structure."""
    markup = """<ul class='nav navbar-nav navbar-right'>
        <li><a href='http://viper.malwareconfig.com'>Viper</a></li>
        <li><a href='http://aptnotes.malwareconfig.com'>APTNotes</a></li>
        <li><a href='/search/'>Search</a></li>
        <li><a href='#' data-toggle='modal' data-target='#aboutModal'>About</a></li>
        <li class='dropdown'>
          <a href='#' class='dropdown-toggle' data-toggle='dropdown'>Help <span class='caret'></span></a>
          <ul class='dropdown-menu' role='menu'>
            <li><a href='/admin'>Admin</a></li>
            <li><a href='#'>Docs</a></li>
            <li><a href='#'>Issues</a></li>
            <li><a href='#'>ChangeLog</a></li>
            <li class='divider'></li>
            <li><a href='#' data-toggle='modal' data-target='#aboutModal'>About</a></li>
          </ul>
        </li>
      </ul>"""

    def link_item(href, label, extra_attrs=None):
        """Expected form of an ``<li>`` that wraps a single labelled link."""
        attrs = {'href': href}
        attrs.update(extra_attrs or {})
        return {'a': [{'_attributes': attrs, '_value': label}]}

    # Extra attributes carried by the two "About" links.
    modal_attrs = {'data-toggle': 'modal', 'data-target': '#aboutModal'}

    dropdown_menu = {
        '_attributes': {'class': ['dropdown-menu'], 'role': 'menu'},
        'li': [
            link_item('/admin', 'Admin'),
            link_item('#', 'Docs'),
            link_item('#', 'Issues'),
            link_item('#', 'ChangeLog'),
            {'_attributes': {'class': ['divider']}},
            link_item('#', 'About', modal_attrs),
        ],
    }
    dropdown_item = {
        '_attributes': {'class': ['dropdown']},
        'a': [{
            '_attributes': {
                'href': '#',
                'class': ['dropdown-toggle'],
                'data-toggle': 'dropdown',
            },
            '_value': 'Help',
            'span': [{'_attributes': {'class': ['caret']}}],
        }],
        'ul': [dropdown_menu],
    }
    expected = {
        'ul': [{
            '_attributes': {'class': ['nav', 'navbar-nav', 'navbar-right']},
            'li': [
                link_item('http://viper.malwareconfig.com', 'Viper'),
                link_item('http://aptnotes.malwareconfig.com', 'APTNotes'),
                link_item('/search/', 'Search'),
                link_item('#', 'About', modal_attrs),
                dropdown_item,
            ],
        }]
    }

    converted = html_to_json.convert(markup)
    print(f'json_output {converted}')
    assert converted == expected
def test_simple_html1():
    """A ``<head>`` with title, meta, link and script tags converts as expected."""
    markup = """<head>
    <title>MalwareConfig - Rule Manager</title>
    <meta charset='UTF-8'>
    <meta name='description' content='Yara Rule Manager'>
    <meta name='google-site-verification' content='zI3MVR02eLr7MZ_BbS_4ZMlqjmmuriRFcvymZ6dD5Vc' />
    <meta name='keywords' content='yara,rules'>
    <link href='/static/css/bootstrap.css' rel='stylesheet'>
    <link href='/static/css/style.css' rel='stylesheet'>
    <script src='https://maps.googleapis.com/maps/api/js?v=3.exp'></script>
</head>"""

    def node(**attributes):
        """Expected form of an element that only carries attributes."""
        return {'_attributes': attributes}

    # In the expected tree the elements following the site-verification
    # <meta> are nested inside it rather than listed as its siblings.
    verification_meta = node(
        name='google-site-verification',
        content='zI3MVR02eLr7MZ_BbS_4ZMlqjmmuriRFcvymZ6dD5Vc',
    )
    verification_meta.update({
        'meta': [node(name='keywords', content='yara,rules')],
        'link': [
            node(href='/static/css/bootstrap.css', rel=['stylesheet']),
            node(href='/static/css/style.css', rel=['stylesheet']),
        ],
        'script': [
            node(src='https://maps.googleapis.com/maps/api/js?v=3.exp'),
        ],
    })

    expected = {
        'head': [{
            'title': [{'_value': 'MalwareConfig - Rule Manager'}],
            'meta': [
                node(charset='UTF-8'),
                node(name='description', content='Yara Rule Manager'),
                verification_meta,
            ],
        }]
    }

    converted = html_to_json.convert(markup)
    print(f'json_output {converted}')
    assert converted == expected
def test_content_2():
    html_string = _read_file('./data/test2.html')
    json_output = html_to_json.convert(html_string)
    print('json_output {}'.format(json_output))
    assert json_output['html'][0]['body'][0]['div'][0]['div'][3]['table'][0][
        'tr'][1:] == [
            {
                'td': [
                    {
                        '_value': '25546'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/ebae9a144636a11dc7bb42724d830109'
                            },
                            '_value': 'ebae9a144636a11dc7bb42724d830109',
                        }]
                    },
                    {
                        '_value': 'June 20, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25545'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/eed5dcfdaea99ce886ce8cb2bed9425f'
                            },
                            '_value': 'eed5dcfdaea99ce886ce8cb2bed9425f',
                        }]
                    },
                    {
                        '_value': 'June 20, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25544'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/PoisonIvy/'
                            },
                            '_value': 'PoisonIvy',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/ba38eb35dc8e6688e4b4aa4f8951ed7f'
                            },
                            '_value': 'ba38eb35dc8e6688e4b4aa4f8951ed7f',
                        }]
                    },
                    {
                        '_value': 'June 4, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25543'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/PoisonIvy/'
                            },
                            '_value': 'PoisonIvy',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/e167b6311a7c435b4d65287ace236591'
                            },
                            '_value': 'e167b6311a7c435b4d65287ace236591',
                        }]
                    },
                    {
                        '_value': 'June 4, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25542'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/6024467685f74f4129512207b2510e43'
                            },
                            '_value': '6024467685f74f4129512207b2510e43',
                        }]
                    },
                    {
                        '_value': 'May 30, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25541'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/c65c3c8c4035481a6833394476c82ff1'
                            },
                            '_value': 'c65c3c8c4035481a6833394476c82ff1',
                        }]
                    },
                    {
                        '_value': 'May 27, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25540'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/41c60a7201487465e7e06921b20c3ec8'
                            },
                            '_value': '41c60a7201487465e7e06921b20c3ec8',
                        }]
                    },
                    {
                        '_value': 'May 6, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25539'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/d953a90802ca685f564ee9a4562f8304'
                            },
                            '_value': 'd953a90802ca685f564ee9a4562f8304',
                        }]
                    },
                    {
                        '_value': 'May 4, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25538'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/Xtreme/'
                            },
                            '_value': 'Xtreme'
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/7799e36a2e9c54c3ef1c3b379d620d82'
                            },
                            '_value': '7799e36a2e9c54c3ef1c3b379d620d82',
                        }]
                    },
                    {
                        '_value': 'April 27, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25537'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/757e55d3785c8bcebb0c20c764923cfd'
                            },
                            '_value': '757e55d3785c8bcebb0c20c764923cfd',
                        }]
                    },
                    {
                        '_value': 'April 22, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25536'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/376568c88494ccb037c91727e0330a96'
                            },
                            '_value': '376568c88494ccb037c91727e0330a96',
                        }]
                    },
                    {
                        '_value': 'April 22, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25535'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/CyberGate/'
                            },
                            '_value': 'CyberGate',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/b1730fff58fd04367cff9b39b2942d15'
                            },
                            '_value': 'b1730fff58fd04367cff9b39b2942d15',
                        }]
                    },
                    {
                        '_value': 'April 20, 2018, 6:37 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25534'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/222d3bc7996197f02093c156eee501b0'
                            },
                            '_value': '222d3bc7996197f02093c156eee501b0',
                        }]
                    },
                    {
                        '_value': 'April 15, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25533'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/fe36d10f6bb264f0059be752f4d5772e'
                            },
                            '_value': 'fe36d10f6bb264f0059be752f4d5772e',
                        }]
                    },
                    {
                        '_value': 'April 14, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25532'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/5ad6c554bd80683b037bd5cccae435f6'
                            },
                            '_value': '5ad6c554bd80683b037bd5cccae435f6',
                        }]
                    },
                    {
                        '_value': 'April 12, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25531'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/51dd3b397a83c7d4c82d0c7b1a3f2800'
                            },
                            '_value': '51dd3b397a83c7d4c82d0c7b1a3f2800',
                        }]
                    },
                    {
                        '_value': 'April 9, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25530'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/5922c431e3c8868cfd6bb729b6389586'
                            },
                            '_value': '5922c431e3c8868cfd6bb729b6389586',
                        }]
                    },
                    {
                        '_value': 'April 8, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25529'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/f58e5c0213c3d16c0735d5a53ff2b2ce'
                            },
                            '_value': 'f58e5c0213c3d16c0735d5a53ff2b2ce',
                        }]
                    },
                    {
                        '_value': 'April 6, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25528'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/202210615e3d74385e58b6242a1373ea'
                            },
                            '_value': '202210615e3d74385e58b6242a1373ea',
                        }]
                    },
                    {
                        '_value': 'April 2, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25527'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/628abfc87f7e7adaf3bfcf6adad6d167'
                            },
                            '_value': '628abfc87f7e7adaf3bfcf6adad6d167',
                        }]
                    },
                    {
                        '_value': 'April 2, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25526'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/ad20b1d4c948a33f0ffbfdc2aaf5275a'
                            },
                            '_value': 'ad20b1d4c948a33f0ffbfdc2aaf5275a',
                        }]
                    },
                    {
                        '_value': 'April 2, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25525'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/e0ee266cb78120568f5fd139d0f60f94'
                            },
                            '_value': 'e0ee266cb78120568f5fd139d0f60f94',
                        }]
                    },
                    {
                        '_value': 'April 2, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25524'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/b7e97ed0da34cc9991d729c35f0249c7'
                            },
                            '_value': 'b7e97ed0da34cc9991d729c35f0249c7',
                        }]
                    },
                    {
                        '_value': 'April 2, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25523'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/DarkComet/'
                            },
                            '_value': 'DarkComet',
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/dc141691c1b1530896f13594a17f62d6'
                            },
                            '_value': 'dc141691c1b1530896f13594a17f62d6',
                        }]
                    },
                    {
                        '_value': 'March 26, 2018, 6:25 a.m.'
                    },
                ]
            },
            {
                'td': [
                    {
                        '_value': '25522'
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href': '/stats/Xtreme/'
                            },
                            '_value': 'Xtreme'
                        }]
                    },
                    {
                        'a': [{
                            '_attributes': {
                                'href':
                                '/config/81160e72402be519311eb81cf4775f6f'
                            },
                            '_value': '81160e72402be519311eb81cf4775f6f',
                        }]
                    },
                    {
                        '_value': 'March 25, 2018, 6:25 a.m.'
                    },
                ]
            },
        ]
def test_content_1():
    html_string = _read_file('./data/test1.html')
    json_output = html_to_json.convert(html_string)