преди 8 месеца · b0767d4bef
--- a/src/unfccc_ghg_data/unfccc_reader/Saint_Kitts_and_Nevis/config_kna_bur1.py
+++ b/src/unfccc_ghg_data/unfccc_reader/Saint_Kitts_and_Nevis/config_kna_bur1.py
@@ -5,10 +5,10 @@ Tables to read:
 
															 - The sector tables in the Annex from page 149 - done
														
 
															 - trend tables page 111-113 - done
														
 
															 - page 116 - done
														
 
															-- page 118- work in progress
														
 
															-- page 119
														
 
															-- page 121
														
 
															-- page 124
														
 
															+- page 118 - done
														
 
															+- page 119 - done
														
 
															+- page 121 - done
														
 
															+- page 123 - wip
														
 
															 Not reading:
														
 
															 - page 97 - trend table with data for 2008, because it's in the trend tables from page 111
														
@@ -70,6 +70,144 @@ conf_general = {
 
															 }
														
 
															 conf_trend = {
														
 
															+    "fugitive": {
														
 
															+        "rows_to_fix": {2: ["1.B.3 - Other emissions from"]},
														
 
															+        "page_defs": {
														
 
															+            "125": {
														
 
															+                "read_params": dict(flavor="lattice"),
														
 
															+                "skip_rows_start": 2,
														
 
															+            },
														
 
															+            "126": {
														
 
															+                "read_params": dict(
														
 
															+                    flavor="stream",
														
 
															+                    table_areas=["72,681,564,638"],
														
 
															+                    columns=["203,238,272,305,340,370,402,439,469,504,536"],
														
 
															+                ),
														
 
															+                "skip_rows_start": 1,
														
 
															+            },
														
 
															+        },
														
 
															+        "entity": f"KYOTOGHG ({gwp_to_use})",
														
 
															+        "unit": "GgCO2eq",
														
 
															+        "header": ["orig_category"],
														
 
															+        "years": [
														
 
															+            "2008",
														
 
															+            "2009",
														
 
															+            "2010",
														
 
															+            "2011",
														
 
															+            "2012",
														
 
															+            "2013",
														
 
															+            "2014",
														
 
															+            "2015",
														
 
															+            "2016",
														
 
															+            "2017",
														
 
															+            "2018",
														
 
															+        ],
														
 
															+        "extra_columns": [],
														
 
															+    },
														
 
															+    "other_sectors": {
														
 
															+        "page_defs": {
														
 
															+            "123": {
														
 
															+                "read_params": dict(flavor="lattice"),
														
 
															+                "skip_rows_start": 2,
														
 
															+            },
														
 
															+        },
														
 
															+        "entity": f"KYOTOGHG ({gwp_to_use})",
														
 
															+        "unit": "GgCO2eq",
														
 
															+        "header": ["orig_category"],
														
 
															+        "years": [
														
 
															+            "2008",
														
 
															+            "2009",
														
 
															+            "2010",
														
 
															+            "2011",
														
 
															+            "2012",
														
 
															+            "2013",
														
 
															+            "2014",
														
 
															+            "2015",
														
 
															+            "2016",
														
 
															+            "2017",
														
 
															+            "2018",
														
 
															+        ],
														
 
															+        "extra_columns": [],
														
 
															+    },
														
 
															+    "transport_sub": {
														
 
															+        "page_defs": {
														
 
															+            "121": {
														
 
															+                "read_params": dict(flavor="lattice"),
														
 
															+                "skip_rows_start": 2,
														
 
															+            },
														
 
															+            "122": {
														
 
															+                "read_params": dict(flavor="lattice"),
														
 
															+                "skip_rows_start": 0,
														
 
															+            },
														
 
															+        },
														
 
															+        "entity": f"KYOTOGHG ({gwp_to_use})",
														
 
															+        "unit": "GgCO2eq",
														
 
															+        "header": ["orig_category"],
														
 
															+        "years": [
														
 
															+            "2008",
														
 
															+            "2009",
														
 
															+            "2010",
														
 
															+            "2011",
														
 
															+            "2012",
														
 
															+            "2013",
														
 
															+            "2014",
														
 
															+            "2015",
														
 
															+            "2016",
														
 
															+            "2017",
														
 
															+            "2018",
														
 
															+        ],
														
 
															+        "extra_columns": [],
														
 
															+    },
														
 
															+    "transport": {
														
 
															+        "page_defs": {
														
 
															+            "119": {
														
 
															+                "read_params": dict(flavor="lattice"),
														
 
															+                "skip_rows_start": 2,
														
 
															+            }
														
 
															+        },
														
 
															+        "entity": f"KYOTOGHG ({gwp_to_use})",
														
 
															+        "unit": "GgCO2eq",
														
 
															+        "header": ["orig_category"],
														
 
															+        "years": [
														
 
															+            "2008",
														
 
															+            "2009",
														
 
															+            "2010",
														
 
															+            "2011",
														
 
															+            "2012",
														
 
															+            "2013",
														
 
															+            "2014",
														
 
															+            "2015",
														
 
															+            "2016",
														
 
															+            "2017",
														
 
															+            "2018",
														
 
															+        ],
														
 
															+        "extra_columns": [],
														
 
															+    },
														
 
															+    "manufacturing_and_construction": {
														
 
															+        "page_defs": {
														
 
															+            "118": {
														
 
															+                "read_params": dict(flavor="lattice"),
														
 
															+                "skip_rows_start": 2,
														
 
															+            }
														
 
															+        },
														
 
															+        "entity": f"KYOTOGHG ({gwp_to_use})",
														
 
															+        "unit": "GgCO2eq",
														
 
															+        "header": ["orig_category"],
														
 
															+        "years": [
														
 
															+            "2008",
														
 
															+            "2009",
														
 
															+            "2010",
														
 
															+            "2011",
														
 
															+            "2012",
														
 
															+            "2013",
														
 
															+            "2014",
														
 
															+            "2015",
														
 
															+            "2016",
														
 
															+            "2017",
														
 
															+            "2018",
														
 
															+        ],
														
 
															+        "extra_columns": [],
														
 
															+    },
														
 
															     "energy_industries": {
														
 
															         "entity": f"KYOTOGHG ({gwp_to_use})",
														
 
															         "unit": "GgCO2eq",
														
@@ -107,6 +245,8 @@ conf_trend = {
 
															         },
														
 
															     },
														
 
															     "overview": {
														
 
															+        # Inconsistencies for table page 11 and page 125 for categories 1.B, 1.B.1 and 1.B.2
														
 
															+        "rows_to_drop": ["1B", "1B1", "1B2"],
														
 
															         "fix_single_value": {
														
 
															             "cat": "MBIO",
														
 
															             "year": "2018",
														
--- a/src/unfccc_ghg_data/unfccc_reader/Saint_Kitts_and_Nevis/read_KNA_BUR1_from_pdf.py
+++ b/src/unfccc_ghg_data/unfccc_reader/Saint_Kitts_and_Nevis/read_KNA_BUR1_from_pdf.py
@@ -99,9 +99,10 @@ if __name__ == "__main__":
 
															         # Remove line break characters
														
 
															         df_table["category"] = df_table["category"].str.replace("\n", " ")
														
 
															         # first the manual replacements
														
 
															-        df_table["category"] = df_table["category"].replace(
														
 
															-            conf_trend[table]["cat_codes_manual"]
														
 
															-        )
														
 
															+        if "cat_codes_manual" in conf_trend[table].keys():
														
 
															+            df_table["category"] = df_table["category"].replace(
														
 
															+                conf_trend[table]["cat_codes_manual"]
														
 
															+            )
														
 
															         # remove dots from category codes
														
 
															         df_table["category"] = df_table["category"].str.replace(".", "")
														
 
															         # then the regex replacements
														
@@ -111,11 +112,18 @@ if __name__ == "__main__":
 
															         df_table = df_table.drop(columns="orig_category")
														
 
															+        # drop rows if needed
														
 
															+        if "rows_to_drop" in conf_trend[table].keys():
														
 
															+            for row in conf_trend[table]["rows_to_drop"]:
														
 
															+                row_to_delete = df_table.index[df_table["category"] == row][0]
														
 
															+                df_table = df_table.drop(index=row_to_delete)
														
 
															+
														
 
															         # clean values
														
 
															         for year in conf_trend[table]["years"]:
														
 
															-            df_table[year] = df_table[year].replace(
														
 
															-                conf_trend[table]["replace_data_entries"]
														
 
															-            )
														
 
															+            if "replace_data_entries" in conf_trend[table].keys():
														
 
															+                df_table[year] = df_table[year].replace(
														
 
															+                    conf_trend[table]["replace_data_entries"]
														
 
															+                )
														
 
															             df_table[year] = df_table[year].str.replace("\n", "")
														
 
															             df_table[year] = df_table[year].str.replace(",", ".")
														
 
															             # invisible numbers in trend table on page 112
														
@@ -152,6 +160,8 @@ if __name__ == "__main__":
 
															             ).reset_index(drop=True)
														
 
															         # break
														
 
															+    # some categories present in main and detailled tables
														
 
															+    df_trend = df_trend.drop_duplicates()
														
 
															     df_trend_if = pm2.pm2io.convert_wide_dataframe_if(
														
 
															         df_trend,
														
@@ -284,4 +294,27 @@ if __name__ == "__main__":
 
															     print("Converting to primap2 format.")
														
 
															     data_main_pm2 = pm2.pm2io.from_interchange_format(df_main_IF)
														
 
															-    pass
														
 
															+    # # ###
														
 
															+    # # Merge tables.
														
 
															+    # # ###
														
 
															+
														
 
															+    print("Merging main and trend table.")
														
 
															+    data_pm2 = data_main_pm2.pr.merge(data_trend_pm2, tolerance=1)
														
 
															+
														
 
															+    # # ###
														
 
															+    # # Save raw data to IF and native format.
														
 
															+    # # ###
														
 
															+
														
 
															+    data_if = data_pm2.pr.to_interchange_format()
														
 
															+
														
 
															+    pm2.pm2io.write_interchange_format(
														
 
															+        output_folder / (output_filename + coords_terminologies["category"] + "_raw"),
														
 
															+        data_if,
														
 
															+    )
														
 
															+
														
 
															+    encoding = {var: compression for var in data_pm2.data_vars}
														
 
															+    data_pm2.pr.to_netcdf(
														
 
															+        output_folder
														
 
															+        / (output_filename + coords_terminologies["category"] + "_raw.nc"),
														
 
															+        encoding=encoding,
														
 
															+    )