def test_date_search_basic():
    place_id = "ok_roger_mills"
    day = "2021-07-09"
    case_number = "CV-2021-14"
    site = Oscn(place_id)
    # Returns list of CaseInfo instances
    results = site.search_by_date(start_date=day,
                                  end_date=day,
                                  case_details=False)
    # There should be a single entry for the searched date
    dates = set([case.filing_date for case in results])
    assert len(dates) == 1
    # There shoud be a single case on this day
    assert len(results) == 1
    # Check for presence of other expected data points
    case = results[0]
    assert case.filing_date == day
    assert case.place_id == place_id
    assert case.number == case_number
    assert case.type_short == "Civil Misc. (CV)"
    assert (case.parties_short ==
            "DCP OPERATING COMPANY LP v. ROGER MILLS COUNTY ASSESSOR")
    # And the absence of case detail, since we didn't
    # request case_detail page to be scraped
    assert getattr(case, "judge", None) is None
Beispiel #2
0
def test_small_counties_date_search_basic():
    place_id = 'ok_alfalfa'
    day = '2021-07-01'
    site = Oscn(place_id)
    results = site.search_by_date(start_date=day,
                                  end_date=day,
                                  case_details=False)
    # There should be a single date
    dates = set([case.filing_date for case in results])
    assert len(dates) == 1
    assert dates == set([day])
    cases = sorted(results, key=lambda case: case.number)
    # There should be four cases on this day
    assert len(cases) == 4
    first = results[0]
    # Check for presence of other expected data points
    assert first.place_id == place_id
    assert first.number == 'CJ-2021-00008'
    assert first.filing_date == day
    expected_parties = [
        'BEISEL, JAMIE S (Plaintiff)', 'BUCK, JAMES MELVIN (Plaintiff)',
        'BUCK, MARLENE SUE (Plaintiff)', 'FIRETHORN HOLDINGS, LLC (Defendant)',
        'HADWIGER, KYLE (ATTORNEY)'
    ]
    assert first.parties == expected_parties
    # And the absence of case detail, since we didn't
    # request case_detail page to be scraped
    assert getattr(first, 'judge', None) is None
def test_date_search_multiple_cases():
    place_id = "ok_roger_mills"
    day = "2021-07-12"
    site = Oscn(place_id)
    # Set case_details to True to trigger detail page scraping
    results = site.search_by_date(start_date=day,
                                  end_date=day,
                                  case_details=True)
    # There should be a single date
    dates = set([case.filing_date for case in results])
    assert len(dates) == 1
    # There should two cases on this day
    assert len(results) == 2
    # Check for presence of other expected data points
    first, second = results
    assert first.number == "TR-2021-161"
    assert second.number == "TR-2021-162"
    # Case details should be available
    # Judge
    assert first.judge == "VerSteeg, F. Pat"
    assert second.judge == "VerSteeg, F. Pat"
    # Closed date
    assert first.close_date is None
    assert second.close_date == "07/15/2021"
    # filing date should be standardized
    assert first.filing_date == day
    assert second.filing_date == day
def test_date_search_with_case_details():
    place_id = "ok_roger_mills"
    day = "2021-07-09"
    case_number = "CV-2021-14"
    site = Oscn(place_id)
    # Here we set case_details to True to trigger detail page scraping
    results = site.search_by_date(start_date=day,
                                  end_date=day,
                                  case_details=True)
    # There should be a single date
    dates = set([case.filing_date for case in results])
    assert len(dates) == 1
    # There should only be a single case on this day
    assert len(results) == 1
    case = results[0]
    # Check for presence of other expected data points
    assert case.filing_date == day
    assert case.place_id == place_id
    assert case.number == case_number
    assert case.type_short == "Civil Misc. (CV)"
    assert (case.parties_short ==
            "DCP OPERATING COMPANY LP v. ROGER MILLS COUNTY ASSESSOR")
    # Case details should be available
    assert case.judge == "Weedon, Jill Carpenter"
    assert case.close_date is None
def test_date_search_many_results():
    place_id = "ok_tulsa"
    day = "2021-07-15"
    site = Oscn(place_id)
    results = site.search_by_date(start_date=day,
                                  end_date=day,
                                  case_details=False)
    # There should be a single entry for the searched date
    dates = set([case.filing_date for case in results])
    assert len(dates) == 1
    # There should be many cases on this day
    assert len(results) == 219
    # Test case type section headers
    expected_case_types = set([
        "Civil Misc. (CV)",
        "Civil relief less than $10,000 (CS)",
        "Civil relief more than $10,000 (CJ)",
        "Criminal Felony (CF)",
        "Criminal Miscellaneous (MI)",
        "Criminal Misdemeanor (CM)",
        "Family and Domestic (FD)",
        "Marriage license (ML)",
        "Minister's Credentials (MC)",
        "Miscellaneous Receipts - Criminal (MRC)",
        "Paternity (FP)",
        "Probate (PB)",
        "Protective Order (PO)",
        "Small Claims (SC)",
    ])
    # Quite a few case types as well
    case_types = set([case.type_short for case in results])
    assert case_types == expected_case_types
Beispiel #6
0
def test_small_counties_no_results():
    place_id = 'ok_alfalfa'
    day = '2021-07-04'
    site = Oscn(place_id)
    results = site.search_by_date(start_date=day,
                                  end_date=day,
                                  case_details=False)
    assert len(results) == 0
Beispiel #7
0
def test_small_counties_defaults_to_current_day():
    from court_scraper.platforms.oscn.site import Site as Oscn
    with mock.patch.object(Oscn, 'current_day', '2021-07-01'):
        place_id = 'ok_alfalfa'
        site = Oscn(place_id)
        results = site.search_by_date(case_details=False)
        dates = set([case.filing_date for case in results])
        assert len(dates) == 1
        assert len(results) == 4
def test_date_search_no_results():
    place_id = "ok_roger_mills"
    day = "2021-07-15"
    site = Oscn(place_id)
    results = site.search_by_date(start_date=day,
                                  end_date=day,
                                  case_details=False)
    # There should be no results for this date
    assert len(results) == 0
Beispiel #9
0
def test_small_counties_multiple_day_results():
    place_id = 'ok_alfalfa'
    start = '2021-07-01'
    end = '2021-07-02'
    site = Oscn(place_id)
    results = site.search_by_date(start_date=start,
                                  end_date=end,
                                  case_details=False)
    dates = set([case.filing_date for case in results])
    assert dates == set([start, end])
    assert len(results) == 10
Beispiel #10
0
def test_search_by_case_id(place_id, case_number, expected):
    site = Oscn(place_id)
    results = site.search(case_numbers=[case_number])
    assert site.place_id == place_id
    assert len(results) == 1
    case = results[0]
    assert case.place_id == place_id
    assert case.number == case_number
    assert case.html.startswith("<!DOCTYPE")
    assert case.filing_date == expected["filing_date"]
    assert case.close_date == expected["close_date"]
    assert case.type == expected["type"]
    assert case.judge == expected["judge"]
Beispiel #11
0
def test_date_search_defaults_to_current_day():
    from court_scraper.platforms.oscn.site import Site as Oscn

    with mock.patch.object(Oscn, "current_day", "2021-07-09"):
        place_id = "ok_roger_mills"
        site = Oscn(place_id)
        results = site.search_by_date(case_details=False)
        # There should be a single entry for the searched date
        dates = set([case.filing_date for case in results])
        assert len(dates) == 1
        case = results[0]
        # Check for presence of other expected data points
        assert case.place_id == place_id
        assert case.filing_date == "2021-07-09"
Beispiel #12
0
def test_date_search_multiple_day_results():
    place_id = "ok_roger_mills"
    start = "2021-07-08"
    end = "2021-07-09"
    site = Oscn(place_id)
    results = site.search_by_date(start_date=start,
                                  end_date=end,
                                  case_details=False)
    # Cases should span multiple days
    dates = set([case.filing_date for case in results])
    assert len(dates) == 2
    assert dates == set([start, end])
    # There should be many cases on this day
    assert len(results) == 2
    first = results[0]
    second = results[1]
    assert first.number == "CV-2021-13"
    assert second.number == "CV-2021-14"
Beispiel #13
0
def test_small_counties_case_details():
    place_id = 'ok_alfalfa'
    day = '2021-07-01'
    site = Oscn(place_id)
    # Here we set case_details to True to trigger detail page scraping
    results = site.search_by_date(start_date=day,
                                  end_date=day,
                                  case_details=True)
    # There should be a single entry for the searched date
    dates = set([case.filing_date for case in results])
    assert len(dates) == 1
    first = sorted(results, key=lambda case: case.number)[0]
    # Check for presence of other expected data points
    assert first.filing_date == day
    assert first.place_id == place_id
    assert first.number == 'CJ-2021-00008'
    # Case details should be available
    assert first.type == 'Civil relief more than $10,000: MONEY JUDGMENT'
    assert first.judge == 'ANGLE, LOREN E.'
    assert first.close_date is None
Beispiel #14
0
def test_search_by_case_id_multiple_results():
    site = Oscn("ok_tulsa")
    case_numbers = ["CJ-2021-2045", "CJ-2018-2919"]
    results = site.search(case_numbers=case_numbers)
    assert len(results) == 2