Daniel Busch 4 months ago
parent
commit
0b3d4c4b1e
2 changed files with 5 additions and 3 deletions
  1. src/faostat_data_primap/download.py (+2 -1)
  2. src/faostat_data_primap/read.py (+3 -2)

+ 2 - 1
src/faostat_data_primap/download.py

@@ -14,7 +14,8 @@ from selenium.webdriver.chrome.options import Options
 from selenium.webdriver.chrome.service import Service
 
 from faostat_data_primap.exceptions import DateTagNotFoundError
-from faostat_data_primap.helper.definitions import domains, downloaded_data_path
+from faostat_data_primap.helper.definitions import domains
+from faostat_data_primap.helper.paths import downloaded_data_path
 
 
 def find_previous_release_path(

+ 3 - 2
src/faostat_data_primap/read.py

@@ -79,7 +79,7 @@ def read_latest_data() -> None:
     for domain, release in files_to_read:
         read_config = read_config_all[domain][release]
 
-        print(f"Read {read_config["filename"]}")
+        print(f"Read {read_config['filename']}")
         dataset_path = downloaded_data_path / domain / release / read_config["filename"]
 
         # There are some non-utf8 characters
@@ -135,9 +135,10 @@ def read_latest_data() -> None:
                 join="outer",
             ).reset_index(drop=True)
 
+    # sometimes Source is empty
     df_all["Source"] = df_all["Source"].fillna("unknown")
 
-    # Rename columns to remove the "Y" prefix
+    # Remove the "Y" prefix for the years columns
     df_all = df_all.rename(columns=lambda x: x.lstrip("Y") if x.startswith("Y") else x)
 
     # Make sure the units are correct