crdanielbusch
/
FAOSTAT_data_primap


			
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354
							import os
import subprocess
from pathlib import Path


def test_read_data_set(tmp_path):
    """Run the download and read scripts end to end and check the output.

    The test first runs ``scripts/download_all_domains.py`` (the data has to
    be downloaded before it can be read in CI), then runs
    ``scripts/read_data_set.py`` with ``--save_path`` pointing at ``tmp_path``
    and ``--run_id 2024``. Both scripts are launched through
    ``poetry run python3`` and must exit with return code 0.

    Afterwards ``tmp_path`` must contain exactly one entry whose name starts
    with ``"v"``, and that entry must contain exactly three files whose
    extensions are ``nc``, ``csv`` and ``yaml``.

    Parameters
    ----------
    tmp_path
        Directory passed to the read script as ``--save_path``
        (presumably pytest's ``tmp_path`` fixture).
    """
    # Both scripts live in the same directory, three levels above this file.
    scripts_dir = Path(__file__).parent.parent.parent / "scripts"
    # Shared launcher prefix for both script invocations.
    launcher = ["poetry", "run", "python3"]

    # Step 1: download, so that there is something to read in CI.
    download_run = subprocess.run(  # noqa: S603
        [*launcher, str(scripts_dir / "download_all_domains.py")],
        capture_output=True,
        text=True,
        check=False,
    )
    assert download_run.returncode == 0, f"Script failed: {download_run.stderr}"

    # Step 2: read the data set and write the results into tmp_path.
    read_args = [
        *launcher,
        str(scripts_dir / "read_data_set.py"),
        "--save_path",
        str(tmp_path),
        "--run_id",
        "2024",
    ]
    read_run = subprocess.run(  # noqa: S603
        read_args,
        capture_output=True,
        text=True,
        check=False,
    )
    assert read_run.returncode == 0, f"Script failed: {read_run.stderr}"

    # Step 3: inspect what was written.
    top_level_entries = os.listdir(tmp_path)
    # Exactly one release directory is expected ...
    assert len(top_level_entries) == 1
    release_name = top_level_entries[0]
    # ... named "v<something>"; the rest changes with each release.
    assert release_name.startswith("v")

    written_files = os.listdir(tmp_path / release_name)
    # The release directory holds three files ...
    assert len(written_files) == 3

    # ... one each of .yaml, .csv and .nc.
    expected_suffixes = {"nc", "csv", "yaml"}
    # Text after the last "." (the whole name if there is no ".").
    found_suffixes = {name.rpartition(".")[2] for name in written_files}
    assert expected_suffixes == found_suffixes