Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Get unit tests passing in the build #161

Merged
merged 2 commits into from
Oct 13, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion .github/workflows/python-app.yml
Original file line number Diff line number Diff line change
Expand Up @@ -41,7 +41,7 @@ jobs:
flake8 . --count --exit-zero --max-complexity=10 --max-line-length=127 --statistics
- name: Test with unittest
run: |
SKIP_SLOW=true python -m unittest discover -v -s ./src/tester
SKIP_SLOW=true python -m unittest -v
- name: Build documentation
run: |
sphinx-build -b html docs build
Expand Down
10 changes: 5 additions & 5 deletions src/orchestrator/__init__.py
Original file line number Diff line number Diff line change
@@ -1,10 +1,10 @@
import sys, os, csv
import os, csv

# Import all of the programs modules within the parent_dir
import scraper
import parser
import cleaner
import updater
from .. import scraper
from .. import parser
from .. import cleaner
from .. import updater

class Orchestrator:
def __init__(self):
Expand Down
8 changes: 2 additions & 6 deletions src/tester/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -9,11 +9,7 @@ Once you've loaded the repository in Visual Studio, you can load the test by usi
{
"python.testing.unittestEnabled": true,
"python.testing.unittestArgs": [
"-v",
"-s",
"./src/tester",
"-p",
"test*.py"
"-v"
]
}
```
Expand Down Expand Up @@ -97,4 +93,4 @@ In progress.

### E. Orchestrator Tests

In progress.
In progress.
Empty file added src/tester/__init__.py
Empty file.
91 changes: 30 additions & 61 deletions src/tester/test_unittest.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,35 +9,31 @@
from bs4 import BeautifulSoup

# Import all of the programs modules within the parent_dir
from scraper import Scraper
from parser import Parser
from cleaner import Cleaner
from updater import Updater
from .. import scraper
from .. import parser
from .. import cleaner
from .. import updater

current_dir = os.path.dirname(os.path.abspath(__file__))
parent_dir = os.path.dirname(current_dir)
project_root = os.path.dirname(parent_dir)

sys.path.append(parent_dir)

SKIP_SLOW = os.getenv("SKIP_SLOW", "false").lower().strip() == "true"


def log(
message, level="INFO"
): # Provide message and info level (optional, defaulting to info)
# configure the logger
log = logging.getLogger(name="pid: " + str(os.getpid()))
logging.basicConfig()
logging.root.setLevel(level=level)
log = logging.getLogger(__name__)
log.info(message)


class ScraperTestCase(unittest.TestCase):
# Defaults for each program are set at the function level.

def test_scrape_get_ody_link(self, county="hays"):
scraper_instance = Scraper()
scraper_instance = scraper.Scraper()
logger = scraper_instance.configure_logger()
county = scraper_instance.format_county(county)
base_url = scraper_instance.get_ody_link(county, logger)
Expand All @@ -57,7 +53,7 @@ def test_scrape_main_page(
case_html_path=None,
county="hays",
):
scraper_instance = Scraper()
scraper_instance = scraper.Scraper()
logger = scraper_instance.configure_logger()
(
ms_wait,
Expand Down Expand Up @@ -130,7 +126,7 @@ def test_scrape_search_page(
# Parse the HTML content with BeautifulSoup
main_soup = BeautifulSoup(main_page_html, "html.parser")
# Look for the court calendar link
scraper_instance = Scraper()
scraper_instance = scraper.Scraper()
logger = scraper_instance.configure_logger()
(
ms_wait,
Expand Down Expand Up @@ -234,7 +230,7 @@ def test_get_hidden_values(
search_soup = BeautifulSoup(search_page_html, "html.parser")

# Run the function
scraper_instance = Scraper()
scraper_instance = scraper.Scraper()
logger = scraper_instance.configure_logger()
(
ms_wait,
Expand Down Expand Up @@ -298,7 +294,7 @@ def test_scrape_individual_case(
os.makedirs(case_html_path, exist_ok=True)

# Call the functions being tested. In this case, the functions being called are all of the subfunctions required and effectively replicates the shape of scrape.
scraper_instance = Scraper()
scraper_instance = scraper.Scraper()
(
ms_wait,
start_date,
Expand Down Expand Up @@ -401,7 +397,7 @@ def test_scrape_individual_case(
case_number_html == "CR-16-0002-A",
"The cause number is not where it was expected to be in the HTML.",
)
# self.logger.info(f"Scraper test sucessful for cause number CR-16-0002-A.")
# self.logger.info(f"scraper.Scraper test sucessful for cause number CR-16-0002-A.")

# This begins the tests related the scrape_cases function for scraping multiple cases.

Expand All @@ -424,7 +420,7 @@ def test_scrape_jo_list(
case_html_path=None,
):
# This test requires that certain dependency functions run first.
scraper_instance = Scraper()
scraper_instance = scraper.Scraper()
(
ms_wait,
start_date,
Expand Down Expand Up @@ -517,7 +513,7 @@ def test_scrape_results_page(
) # Read the entire file content into a string
hidden_values = hidden_values.replace("'", '"')
hidden_values = json.loads(hidden_values)
scraper_instance = Scraper()
scraper_instance = scraper.Scraper()
(
ms_wait,
start_date,
Expand Down Expand Up @@ -669,7 +665,7 @@ def test_scrape_multiple_cases(
hidden_values = json.loads(hidden_values)

# There are some live depency functions that have to be run before the primary code can be run.
scraper_instance = Scraper()
scraper_instance = scraper.Scraper()
(
ms_wait,
start_date,
Expand Down Expand Up @@ -789,53 +785,41 @@ def setUp(self):
self.case_json_path = os.path.join(self.test_dir, "hays", "case_json")
os.makedirs(self.case_json_path, exist_ok=True)

self.mock_logger = MagicMock()
self.parser_instance = Parser()
self.mock_logger = logging.getLogger(__name__)
self.parser_instance = parser.Parser()
self.case_html_path = os.path.abspath(
os.path.join(
os.path.dirname(__file__), "../../resources/test_files/parser_testing"
)
)

@patch("parser.Parser.get_class_and_method")
def test_parser_class_and_method(self, mock_import_module):
mock_logger = MagicMock()
mock_class = MagicMock()
mock_method = MagicMock()

mock_import_module.return_value = mock_class.return_value, mock_method

parser_instance = Parser()
def test_parser_class_and_method(self):
parser_instance = parser.Parser()

instance, method = parser_instance.get_class_and_method(
logger=mock_logger, county="hays", test=True
logger=self.mock_logger, county="hays", test=True
)

self.assertEqual(instance, mock_class.return_value)
self.assertEqual(method, mock_method)
self.assertIn('extract_rows', dir(instance))

@patch("os.makedirs")
def test_parser_directories_single_file(self, mock_makedirs):
mock_logger = MagicMock()
parser_instance = Parser()
parser_instance = parser.Parser()
case_html_path, case_json_path = parser_instance.get_directories(
"hays", mock_logger, parse_single_file=True
"hays", self.mock_logger, parse_single_file=True
)

base_dir = os.path.abspath(os.path.join(os.path.dirname(__file__), "..", ".."))
expected_path = os.path.join(base_dir, "resources", "test_files")

self.assertEqual(case_html_path, expected_path)
self.assertEqual(case_json_path, expected_path)
mock_logger.info.assert_called()

@patch("os.makedirs")
@patch("os.path.exists", return_value=False)
def test_parser_directories_multiple_files(self, mock_exists, mock_makedirs):
mock_logger = MagicMock()
parser_instance = Parser()
parser_instance = parser.Parser()
case_html_path, case_json_path = parser_instance.get_directories(
"hays", mock_logger, parse_single_file=False
"hays", self.mock_logger, parse_single_file=False
)

base_dir = os.path.abspath(os.path.join(os.path.dirname(__file__), "..", ".."))
Expand All @@ -845,7 +829,6 @@ def test_parser_directories_multiple_files(self, mock_exists, mock_makedirs):
self.assertEqual(case_html_path, expected_html_path)
self.assertEqual(case_json_path, expected_json_path)
mock_makedirs.assert_called_once_with(expected_json_path, exist_ok=True)
mock_logger.info.assert_called()

def test_parser_list_of_single_html_file(self):
case_number = "51652356"
Expand All @@ -862,7 +845,6 @@ def test_parser_list_of_single_html_file(self):
expected_path = os.path.join(relative_path, f"test_{case_number}.html")

self.assertEqual(case_list, [expected_path])
self.mock_logger.info.assert_called()

def test_parser_list_of_single_html_file_by_casenumber(self):
case_number = "51652356"
Expand All @@ -880,10 +862,8 @@ def test_parser_list_of_single_html_file_by_casenumber(self):
expected_list = [os.path.join(relative_path, f"test_{case_number}.html")]

self.assertEqual(case_list, expected_list)
self.mock_logger.info.assert_called()

@patch("os.path.join", side_effect=lambda *args: "\\".join(args))
def test_parser_list_of_multiple_html_files(self, mock_join):
def test_parser_list_of_multiple_html_files(self):
os.makedirs(self.case_html_path, exist_ok=True)

with open(os.path.join(self.case_html_path, "test_1.html"), "w") as f:
Expand All @@ -907,7 +887,6 @@ def test_parser_list_of_multiple_html_files(self, mock_join):
]

self.assertEqual(set(case_list), set(expected_list))
self.mock_logger.info.assert_called()

def test_parser_get_list_of_html_error_handling(self):
invalid_path = "invalid/path"
Expand All @@ -921,43 +900,34 @@ def test_parser_get_list_of_html_error_handling(self):
self.mock_logger,
parse_single_file=False,
)
self.mock_logger.info.assert_called()

@patch("os.path.join")
@patch("logging.getLogger")
def test_get_html_path(self, mock_logger, mock_path_join):
def test_get_html_path(self):
updated_html_path = os.path.join(self.case_html_path, "multiple_html_files")
case_html_file_name = "parserTest_51652356.html"
case_number = "51652356"

mock_path_join.return_value = f"{updated_html_path}/{case_html_file_name}"

result = self.parser_instance.get_html_path(
updated_html_path, case_html_file_name, case_number, self.mock_logger
)

self.assertEqual(result, f"{updated_html_path}/{case_html_file_name}")

@patch("builtins.open", new_callable=mock_open)
@patch("json.dumps")
@patch("parser.logging.getLogger")
def test_write_json_data(self, mock_logger, mock_json_dumps, mock_open_func):
def test_write_json_data(self, mock_open_func):
case_json_path = "/mock/path"
case_number = "123456"
case_data = {"data": "value"}

self.parser_instance.write_json_data(
case_json_path, case_number, case_data, mock_logger
case_json_path, case_number, case_data, self.mock_logger
)

mock_open_func.assert_called_once_with(
os.path.join(case_json_path, case_number + ".json"), "w"
)
mock_json_dumps.assert_called_once_with(case_data, indent=4)

@patch("builtins.open", new_callable=mock_open)
@patch("parser.logging.getLogger")
def test_write_error_log(self, mock_logger, mock_open_func):
def test_write_error_log(self, mock_open_func):
county = "hays"
case_number = "123456"

Expand All @@ -972,8 +942,7 @@ def test_write_error_log(self, mock_logger, mock_open_func):

def test_parser_end_to_end(self, county="hays", case_number='123456'):

parser = Parser()
parser.parse(county=county,
self.parser_instance.parse(county=county,
case_number=case_number,
parse_single_file=True,
test = True)
Expand Down
Loading