# This script reads data from Taiwan's 2022 national inventory.
# Data is read from the English summary PDF.

import pandas as pd
import primap2 as pm2
from pathlib import Path
import camelot
import copy

from primap2.pm2io._data_reading import matches_time_format

from config_TWN_NIR2022 import table_defs, page_defs
from config_TWN_NIR2022 import fix_rows, make_wide_table
from config_TWN_NIR2022 import gwp_to_use

# ###
# configuration
# ###

root_path = Path(__file__).parents[3].absolute()
root_path = root_path.resolve()
downloaded_data_path = root_path / "downloaded_data"
extracted_data_path = root_path / "extracted_data"

input_folder = downloaded_data_path / 'non-UNFCCC' / 'Taiwan'
# TODO: move file to subfolder
output_folder = extracted_data_path / 'non-UNFCCC' / 'Taiwan'
if not output_folder.exists():
    output_folder.mkdir()

output_filename = 'TWN_inventory_2022_'
inventory_file = '00_abstract_en.pdf'

# regular expression to extract the category code from category
# names like "1.A Fuel Combustion Activities"
cat_code_regexp = r'(?P<code>^[a-zA-Z0-9\.]{1,7})\s.*'

time_format = "%Y"
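
# Illustration only (assumes `import re`; the script itself applies the
# regex via pandas further below):
#   re.match(cat_code_regexp, "1.A.1 Energy Industries").group("code")
# returns '1.A.1', dropping the category name after the first whitespace.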

coords_cols = {
    "category": "category",
    "entity": "entity",
    "unit": "unit",
    # "area": "Geo_code",
}

add_coords_cols = {
    # "orig_cat_name": ["orig_cat_name", "category"],
}

coords_terminologies = {
    "area": "ISO3",
    "category": "IPCC2006_1996_Taiwan_Inv",
    "scenario": "PRIMAP",
}

coords_defaults = {
    "source": "TWN-GHG-Inventory",
    "provenance": "measured",
    "scenario": "2022NIR",
    "area": "TWN",
    # the unit is set per table below
}

coords_value_mapping = {
    "unit": "PRIMAP1",
    "category": "PRIMAP1",
}

coords_value_filling = {}

filter_remove = {}

filter_keep = {}

meta_data = {
    "references": "https://unfccc.saveoursky.org.tw/nir/tw_nir_2022.php",
    "rights": "",
    "contact": "mail@johannes-guetschow.de",
    "title": "2022 Republic of China - National Greenhouse Gas Report",
    "comment": "Read from pdf file and converted to PRIMAP2 format by Johannes Gütschow",
    "institution": "Republic of China - Environmental Protection Administration",
}

# config for part 3: mapping to IPCC 2006 categories

cat_mapping = {
    '3': 'M.AG',
    '3.A': '3.A.1',
    '3.B': '3.A.2',
    '3.C': '3.C.7',
    '3.D': 'M.3.AS',
    '3.F': '3.C.1.b',
    '3.H': '3.C.3',
    '4': 'M.LULUCF',
    '5': '4',
    '5.A': '4.A',
    '5.B': '4.B',
    '5.C': '4.C',
    '5.D': '4.D',
    '5.D.1': '4.D.1',
    '5.D.2': '4.D.2',
}
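
# Example of the mapping above: the inventory category code '3.B' is
# re-coded to '3.A.2' in the IPCC 2006 structure; the mapping is applied
# to the category column via DataFrame.replace further below.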

aggregate_cats = {
    '1.A': {'sources': ['1.A.1', '1.A.2', '1.A.3', '1.A.4'],
            'name': 'Fuel Combustion Activities'},
    '1.B': {'sources': ['1.B.1', '1.B.2'], 'name': 'Fugitive Emissions from Fuels'},
    '3.A': {'sources': ['3.A.1', '3.A.2'], 'name': 'Livestock'},
    '3.C.1': {'sources': ['3.C.1.b'], 'name': 'Emissions from Biomass Burning'},
    '3.C.5': {'sources': ['3.C.5.a', '3.C.5.b'],
              'name': 'Indirect N2O Emissions from Managed Soils'},
    '3.C': {'sources': ['3.C.1', '3.C.3', 'M.3.AS', '3.C.7'],
            'name': 'Aggregate sources and non-CO2 emissions sources on land'},
    '3': {'sources': ['M.AG', 'M.LULUCF'], 'name': 'AFOLU'},
    'M.AG.ELV': {'sources': ['3.C'],
                 'name': 'Agriculture excluding livestock emissions'},
}

# aggregate category 2 for NF3 and PFCs (reported in subsector 2.E only)
aggregate_cats_NF3_PFC = {
    '2': {'sources': ['2.E'], 'name': 'Industrial Process and Product Use Sector'},
}

compression = dict(zlib=True, complevel=9)
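
# These zlib compression settings are applied per data variable as the
# netCDF encoding when the datasets are written at the end of this script.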

# ###
# read the tables from pdf
# ###

all_tables = []
for page in page_defs:
    print(f"Reading from page {page}")
    new_tables = camelot.read_pdf(
        str(input_folder / inventory_file),
        pages=page,
        **page_defs[page],
    )
    for table in new_tables:
        all_tables.append(table.df)
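
# Optional sanity check (illustrative addition): table_defs refers to the
# raw tables by their position in all_tables, so the count read from the
# PDF must match the indices used in the config.
print(f"Collected {len(all_tables)} raw tables from {inventory_file}")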

# ###
# convert tables to primap2 format
# ###
data_pm2 = None
for table_name in table_defs.keys():
    print(f"Working on table: {table_name}")

    table_def = copy.deepcopy(table_defs[table_name])
    # combine all raw tables that belong to this table definition
    df_this_table = all_tables[table_def["tables"][0]].copy(deep=True)
    if len(table_def["tables"]) > 1:
        for table in table_def["tables"][1:]:
            df_this_table = pd.concat(
                [df_this_table, all_tables[table]],
                axis=0,
                join='outer')

    # fix for table ES3.6: the subscript "2" of "Total CO2 Emission" is
    # lost in the PDF extraction; repair the label and blank the data
    # cells of the broken row
    if table_name == 'ES3.6':
        row_idx = df_this_table[0] == "Total CO Emission"
        df_this_table.loc[row_idx, 1:] = ''
        df_this_table.loc[row_idx, 0] = 'Total CO2 Emission'

    df_this_table = df_this_table.reset_index(drop=True)

    # fix categories if necessary
    if "fix_cats" in table_def.keys():
        for col in table_def["fix_cats"]:
            df_this_table[col] = df_this_table[col].replace(table_def["fix_cats"][col])

    # fix rows that were split over several lines during PDF extraction
    for col in table_def["rows_to_fix"].keys():
        for n_rows in table_def["rows_to_fix"][col].keys():
            print(f"Fixing {col}, {n_rows}")
            # replace line breaks, long hyphens, and double and triple
            # spaces in category names
            df_this_table.iloc[:, 0] = df_this_table.iloc[:, 0].str.replace("\n", " ")
            df_this_table.iloc[:, 0] = df_this_table.iloc[:, 0].str.replace("   ", " ")
            df_this_table.iloc[:, 0] = df_this_table.iloc[:, 0].str.replace("  ", " ")
            df_this_table.iloc[:, 0] = df_this_table.iloc[:, 0].str.replace("–", "-")
            df_this_table = fix_rows(df_this_table,
                                     table_def["rows_to_fix"][col][n_rows], col, n_rows)
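
    # fix_rows (from config_TWN_NIR2022) re-joins category labels that the
    # PDF reader split across n_rows consecutive rows; the affected labels
    # and row counts are listed per table in the config.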

    # split by entity where a table stacks several gases: assign an entity
    # to each row by carrying the last gas header found in the table forward
    if "gas_splitting" in table_def.keys():
        col_entity = [''] * len(df_this_table)
        last_entity = ''
        for i in range(0, len(df_this_table)):
            current_header = df_this_table[table_def["col_wide_kwd"]].iloc[i]
            if current_header in table_def["gas_splitting"].keys():
                last_entity = table_def["gas_splitting"][current_header]
            col_entity[i] = last_entity

        df_this_table["entity"] = col_entity
        table_def["index_cols"].append("entity")

    # make a wide table
    df_this_table = make_wide_table(df_this_table, table_def["wide_keyword"],
                                    table_def["col_wide_kwd"], table_def["index_cols"])

    if "drop_rows" in table_def.keys():
        df_this_table = df_this_table.drop(table_def["drop_rows"], axis=0)

    # reset row index
    df_this_table = df_this_table.reset_index(drop=False)

    # add entity (for single-gas tables the entity is fixed in the config)
    if "entity" in table_def.keys():
        df_this_table["entity"] = table_def["entity"]

    # add unit
    df_this_table["unit"] = table_def["unit"]

    df_this_table = df_this_table.rename({table_def["index_cols"][0]: "orig_cat_name"},
                                         axis=1)

    # make a copy of the categories column
    df_this_table["category"] = df_this_table["orig_cat_name"]

    # replace category names by codes in the "category" column:
    # first the manual replacements
    df_this_table["category"] = df_this_table["category"].replace(
        table_def["cat_codes_manual"])
    # then the regex replacements
    repl = lambda m: m.group('code')
    df_this_table["category"] = df_this_table["category"].str.replace(cat_code_regexp,
                                                                      repl, regex=True)

    ### convert to PRIMAP2 interchange format (IF)
    # identify the year columns and remove thousands separators
    # (e.g. "12,345" -> "12345") so the values can be parsed as numbers
    time_format = '%Y'
    time_columns = [
        col
        for col in df_this_table.columns.values
        if matches_time_format(col, time_format)
    ]

    for col in time_columns:
        df_this_table.loc[:, col] = df_this_table.loc[:, col].str.replace(',', '',
                                                                          regex=False)

    # drop orig_cat_name as it's not unique per category
    df_this_table = df_this_table.drop(columns="orig_cat_name")

    df_this_table_if = pm2.pm2io.convert_wide_dataframe_if(
        df_this_table,
        coords_cols=coords_cols,
        add_coords_cols=add_coords_cols,
        coords_defaults=coords_defaults,
        coords_terminologies=coords_terminologies,
        coords_value_mapping=coords_value_mapping,
        # coords_value_filling=coords_value_filling,
        # filter_remove=filter_remove,
        # filter_keep=filter_keep,
        meta_data=meta_data,
    )

    this_table_pm2 = pm2.pm2io.from_interchange_format(df_this_table_if)

    # merge the table into the full dataset
    if data_pm2 is None:
        data_pm2 = this_table_pm2
    else:
        data_pm2 = data_pm2.pr.merge(this_table_pm2)

# convert back to IF to have units in the fixed format
data_if = data_pm2.pr.to_interchange_format()

# ###
# convert to IPCC2006 categories
# ###
data_if_2006 = data_if.copy(deep=True)
data_if_2006 = data_if_2006.replace(
    {'category (IPCC2006_1996_Taiwan_Inv)': cat_mapping})

# rename the category column and update the metadata accordingly
data_if_2006.rename(
    columns={'category (IPCC2006_1996_Taiwan_Inv)': 'category (IPCC2006_PRIMAP)'},
    inplace=True)
data_if_2006.attrs['attrs']['cat'] = 'category (IPCC2006_PRIMAP)'
data_if_2006.attrs['dimensions']['*'] = [
    'category (IPCC2006_PRIMAP)' if item == 'category (IPCC2006_1996_Taiwan_Inv)'
    else item for item in data_if_2006.attrs['dimensions']['*']]

# aggregate categories as defined in aggregate_cats
for cat_to_agg in aggregate_cats:
    mask = data_if_2006["category (IPCC2006_PRIMAP)"].isin(
        aggregate_cats[cat_to_agg]["sources"])
    df_test = data_if_2006[mask]

    if len(df_test) > 0:
        print(f"Aggregating category {cat_to_agg}")
        df_combine = df_test.copy(deep=True)

        time_format = '%Y'
        time_columns = [
            col
            for col in df_combine.columns.values
            if matches_time_format(col, time_format)
        ]

        for col in time_columns:
            df_combine[col] = pd.to_numeric(df_combine[col], errors="coerce")

        # numeric_only=True drops the non-grouped category column, which
        # pandas >= 2 no longer does silently
        df_combine = df_combine.groupby(
            by=['source', 'scenario (PRIMAP)', 'provenance', 'area (ISO3)', 'entity',
                'unit']).sum(numeric_only=True)

        df_combine.insert(0, "category (IPCC2006_PRIMAP)", cat_to_agg)

        df_combine = df_combine.reset_index()

        # DataFrame.append was removed in pandas 2.0; use pd.concat instead
        data_if_2006 = pd.concat([data_if_2006, df_combine])
        data_if_2006 = data_if_2006.reset_index(drop=True)
    else:
        print(f"No data to aggregate for category {cat_to_agg}")
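
# Example: after this loop, category '3' (AFOLU) contains the sum of the
# time series of M.AG and M.LULUCF, as configured in aggregate_cats above.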

# aggregate category 2 for NF3 and PFCs, which are only reported in 2.E
for cat_to_agg in aggregate_cats_NF3_PFC:
    mask = data_if_2006["category (IPCC2006_PRIMAP)"].isin(
        aggregate_cats_NF3_PFC[cat_to_agg]["sources"])
    mask_gas = data_if_2006["entity"].isin(
        [f"NF3 ({gwp_to_use})", f"PFCs ({gwp_to_use})"])
    df_test = data_if_2006[mask & mask_gas]

    if len(df_test) > 0:
        print(f"Aggregating category {cat_to_agg}")
        df_combine = df_test.copy(deep=True)

        time_format = '%Y'
        time_columns = [
            col
            for col in df_combine.columns.values
            if matches_time_format(col, time_format)
        ]

        for col in time_columns:
            df_combine[col] = pd.to_numeric(df_combine[col], errors="coerce")

        df_combine = df_combine.groupby(
            by=['source', 'scenario (PRIMAP)', 'provenance', 'area (ISO3)', 'entity',
                'unit']).sum(numeric_only=True)

        df_combine.insert(0, "category (IPCC2006_PRIMAP)", cat_to_agg)

        df_combine = df_combine.reset_index()

        data_if_2006 = pd.concat([data_if_2006, df_combine])
        data_if_2006 = data_if_2006.reset_index(drop=True)
    else:
        print(f"No data to aggregate for category {cat_to_agg}")

# conversion to PRIMAP2 native format
data_pm2_2006 = pm2.pm2io.from_interchange_format(data_if_2006)

# convert the CO2eq time series to mass units
entities_to_convert = ['N2O', 'SF6', 'CH4', 'NF3']
entities_to_convert = [f"{entity} ({gwp_to_use})" for entity in entities_to_convert]

for entity in entities_to_convert:
    converted = data_pm2_2006[entity].pr.convert_to_mass()
    basic_entity = entity.split(" ")[0]
    converted = converted.to_dataset(name=basic_entity)
    data_pm2_2006 = data_pm2_2006.pr.merge(converted)
    data_pm2_2006[basic_entity].attrs["entity"] = basic_entity
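
# Illustration only: with gwp_to_use set to e.g. "AR4GWP100", the entity
# "CH4 (AR4GWP100)" stores CH4 in CO2-equivalent units; converting to mass
# divides by the GWP factor (25 for CH4 under AR4 GWP100), so 25 t CO2eq
# of CH4 become 1 t CH4.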

# drop the CO2eq (GWP) variables, which are superseded by the mass units
data_pm2_2006 = data_pm2_2006.drop_vars(entities_to_convert)

# convert to IF
data_if_2006 = data_pm2_2006.pr.to_interchange_format()

# ###
# save data
# ###
# data in original categories
pm2.pm2io.write_interchange_format(output_folder /
                                   (output_filename + coords_terminologies["category"]),
                                   data_if)
encoding = {var: compression for var in data_pm2.data_vars}
data_pm2.pr.to_netcdf((output_folder /
                       (output_filename + coords_terminologies[
                           "category"])).with_suffix(".nc"),
                      encoding=encoding)

# data in 2006 categories
pm2.pm2io.write_interchange_format(output_folder /
                                   (output_filename + "IPCC2006_PRIMAP"), data_if_2006)
encoding = {var: compression for var in data_pm2_2006.data_vars}
data_pm2_2006.pr.to_netcdf((output_folder /
                            (output_filename + "IPCC2006_PRIMAP")).with_suffix(".nc"),
                           encoding=encoding)
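
# Usage sketch (not executed here): the interchange format files written
# above can be read back with primap2, e.g.
#   data_read = pm2.pm2io.read_interchange_format(
#       output_folder / (output_filename + "IPCC2006_PRIMAP"))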