NETL-RIC
diff --git a/‎README.md
Lines changed: 3 additions & 0 deletions b/‎README.md
Lines changed: 3 additions & 0 deletions
diff --git a/‎electricitylci/__init__.py
Lines changed: 13 additions & 11 deletions b/‎electricitylci/__init__.py
Lines changed: 13 additions & 11 deletions
diff --git a/‎electricitylci/coal_upstream.py
Lines changed: 56 additions & 38 deletions b/‎electricitylci/coal_upstream.py
Lines changed: 56 additions & 38 deletions
@@ -60,3 +60,6 @@ EWI`
     * Successfully installs:
         + mpmath-1.3.0
         + sympy-1.12
++ `pip install scipy`
+    * Successfully installs:
+        + scipy-1.11.1
@@ -49,7 +49,7 @@ def get_generation_process_df(regions=None, **kwargs):
         import electricitylci.plant_water_use as water
         water_df = water.generate_plant_water_use(config.model_specs.eia_gen_year)
         generation_process_df=concat_clean_upstream_and_plant(generation_process_df,water_df)
-    
+
     if config.model_specs.include_upstream_processes is True:
         try:
             upstream_df = kwargs['upstream_df']
@@ -99,11 +99,11 @@ def get_generation_mix_process_df(regions=None):
     """
     Create a dataframe of generation mixes by fuel type in each subregion.
 
-    This function imports and uses the parameter 'replace_egrid' and 
+    This function imports and uses the parameter 'replace_egrid' and
     'gen_mix_from_model_generation_data' from model_config.py. If 'replace_egrid'
-    is true or the specified 'regions' is true, then the generation mix will 
+    is true or the specified 'regions' is true, then the generation mix will
     come from EIA 923 data. If 'replace_egrid' is false then the generation
-    mix will either come from the eGRID reference data 
+    mix will either come from the eGRID reference data
     ('gen_mix_from_model_generation_data' is false) or from the generation data
     from this model ('gen_mix_from_model_generation_data' is true).
 
@@ -130,7 +130,7 @@ def get_generation_mix_process_df(regions=None):
         create_generation_mix_process_df_from_model_generation_data,
     )
     from electricitylci.eia923_generation import build_generation_data
-    
+
     if regions is None:
         regions = config.model_specs.regional_aggregation
 
@@ -277,9 +277,11 @@ def write_process_dicts_to_jsonld(*process_dicts):
 
     """
     from electricitylci.olca_jsonld_writer import write
-    
+
     all_process_dicts = dict()
     for d in process_dicts:
+        # Merge each dictionary into the accumulator with ** unpacking;
+        # on duplicate keys, the value from the later dictionary wins.
         all_process_dicts = {**all_process_dicts, **d}
     olca_dicts = write(all_process_dicts, config.model_specs.namestr)
     return olca_dicts
@@ -297,7 +299,7 @@ def get_upstream_process_df(eia_gen_year):
     import electricitylci.nuclear_upstream as nuke
     import electricitylci.power_plant_construction as const
     from electricitylci.combinator import concat_map_upstream_databases
-    
+
     logger.info("Generating upstream inventories...")
     coal_df = coal.generate_upstream_coal(eia_gen_year)
     ng_df = ng.generate_upstream_ng(eia_gen_year)
@@ -376,9 +378,9 @@ def combine_upstream_and_gen_df(gen_df, upstream_df):
 
 def get_gen_plus_netl():
     """
-    This will combine the netl life cycle data for solar, solar thermal, 
+    This will combine the netl life cycle data for solar, solar thermal,
     geothermal, wind, and hydro and will include impacts from construction, etc.
-    that would be omitted from the regular sources of emissions. 
+    that would be omitted from the regular sources of emissions.
     It then generates power plant emissions. The two different dataframes are
     combined to provide a single dataframe representing annual emissions or
     life cycle emissions apportioned over the appropriate number of years for
@@ -398,7 +400,7 @@ def get_gen_plus_netl():
     import electricitylci.wind_upstream as wind
     import electricitylci.hydro_upstream as hydro
     import electricitylci.solar_thermal_upstream as solartherm
-    
+
     eia_gen_year = config.model_specs.eia_gen_year
     logger.info(
         "Generating inventories for geothermal, solar, wind, hydro, and solar thermal..."
@@ -511,7 +513,7 @@ def write_gen_fuel_database_to_dict(
     #of dictionaries for other levels of aggregation. This logic will need to
     #be implemented in main.py so that FERC consumption mixes can be made
     #using the required BA aggregation.
-    # if subregion in ["BA","FERC","US"]:    
+    # if subregion in ["BA","FERC","US"]:
     #     subregion="BA"
     logger.info("Converting generator dataframe to dictionaries...")
     gen_plus_fuel_dict = olcaschema_genprocess(
 
@@ -1,23 +1,31 @@
 #!/usr/bin/python
 # -*- coding: utf-8 -*-
-if __name__=='__main__':
-    import electricitylci.model_config as config
-    config.model_specs = config.build_model_class()
+#
+# coal_upstream.py
+#
+##############################################################################
+# REQUIRED MODULES
+##############################################################################
+import logging
+import os
+from os.path import join
 
+import numpy as np
 import pandas as pd
-import regex
-from sqlalchemy import false
-from electricitylci.globals import paths, data_dir, output_dir
+import requests
+
+from electricitylci.globals import paths
+from electricitylci.globals import data_dir
+from electricitylci.globals import output_dir
 from electricitylci.eia923_generation import eia923_download
-import os
-from os.path import join
 from electricitylci.utils import find_file_in_folder
-import requests
 import electricitylci.PhysicalQuantities as pq
-import numpy as np
-import logging
-logger = logging.getLogger("coal_upstream")
 
+
+##############################################################################
+# GLOBALS
+##############################################################################
+logger = logging.getLogger("coal_upstream")
 coal_type_codes={'BIT': 'B',
                  'LIG': 'L',
                  'SUB': 'S',
@@ -46,6 +54,9 @@
                 'Avg Truck Ton*Miles': 'Truck'}
 
 
+##############################################################################
+# FUNCTIONS
+##############################################################################
 def eia_7a_download(year, save_path):
     eia7a_base_url = 'http://www.eia.gov/coal/data/public/xls/'
     name = 'coalpublic{}.xls'.format(year)
@@ -99,7 +110,7 @@ def read_eia923_fuel_receipts(year):
                     if '.csv' in f
                     and '_page_5_reduced.csv' in f]
         if csv_file:
-            csv_path = os.path.join(expected_923_folder, csv_file[0])
+            csv_path = join(expected_923_folder, csv_file[0])
             eia_fuel_receipts_df=pd.read_csv(csv_path, low_memory=False)
         else:
             eia923_path, eia923_name = find_file_in_folder(
@@ -392,66 +403,66 @@ def wtd_mean(pdser, total_db):
             right_on=["Coal Code"],
             how="left"
             )
-    
+
     coal_mining_inventory_df = pd.concat([existing_scens_merge,missing_scens_merge],sort=False).reset_index(drop=True)
-    
-    
-    # Multiply coal mining emission factor by coal quantity; 
+
+
+    # Multiply coal mining emission factor by coal quantity;
     # convert to kg - coal input in tons (US)
     coal_mining_inventory_df["FlowAmount"] = (
             pq.convert(1,'ton','kg')*
             coal_mining_inventory_df["p50"].multiply(
                     coal_mining_inventory_df['quantity'],axis = "index")
             )
-    
+
     coal_mining_inventory_df["Source"]="Mining"
     coal_mining_inventory_df=coal_mining_inventory_df[["plant_id","coal_source_code","quantity","FlowName","FlowAmount","Compartment","input","Source","FlowUUID","ElementaryFlowPrimeContext","Unit","FlowType"]]
     # Keep the plant ID and air emissions columns
 #    merged_input_eia_coal_a = merged_input_eia_coal_a[
 #            ['plant_id','coal_source_code','quantity'] + column_air_emission]
-    
-    # Groupby the plant ID since some plants have multiple row entries 
+
+    # Groupby the plant ID since some plants have multiple row entries
     # (receive coal from multiple basins)
 #    merged_input_eia_coal_grouped = (
 #            merged_input_eia_coal_a.groupby(
 #                    by=['plant_id','coal_source_code'],
 #                    as_index=False)[['quantity',"FlowAmount"]].sum())
 #    merged_input_eia_coal_grouped = merged_input_eia_coal_a.reset_index(drop=True)
-    
+
     # Melting the database on Plant ID
 #    melted_database_air = merged_input_eia_coal_a.melt(
-#            id_vars = ['plant_id','coal_source_code','quantity'], 
-#            var_name = 'FlowName', 
+#            id_vars = ['plant_id','coal_source_code','quantity'],
+#            var_name = 'FlowName',
 #            value_name = 'FlowAmount')
-    
-    
-    # Repeat the same methods for emissions from transportation 
+
+
+    # Repeat the same methods for emissions from transportation
     coal_transportation = coal_transportation.melt(
             'Plant Government ID',var_name = 'Transport')
     coal_transportation["value"]=coal_transportation["value"]*pq.convert(1,"ton","kg")*pq.convert(1,"mi","km")
     merged_transport_coal = coal_transportation.merge(
-            coal_inventory_transportation, 
-            left_on = ['Transport'], 
+            coal_inventory_transportation,
+            left_on = ['Transport'],
             right_on =['Modes'],
             how = 'left')
-    
+
     # multiply transportation emission factor (kg/kg-mi) by total transportation
     # (ton-miles)
     column_air_emission=[x for x in coal_inventory_transportation.columns[1:] if "Unnamed" not in x]
     merged_transport_coal[column_air_emission] = (
             # pq.convert(1,'ton','kg')*
             merged_transport_coal[column_air_emission].multiply(
                     merged_transport_coal['value'],axis = "index"))
-    
+
     merged_transport_coal.rename(columns={'Plant Government ID':'plant_id'},
                                  inplace=True)
-    
-    # Groupby the plant ID since some plants have multiple row entries 
+
+    # Groupby the plant ID since some plants have multiple row entries
     # (receive coal from multiple basins)
     merged_transport_coal= merged_transport_coal.groupby(
             ['plant_id','Transport'])[['value']+column_air_emission].sum()
     merged_transport_coal= merged_transport_coal.reset_index()
-    
+
     # Keep the plant ID and emissions columns
     merged_transport_coal = (
             merged_transport_coal[
@@ -461,13 +472,13 @@ def wtd_mean(pdser, total_db):
                                  inplace=True)
     # Melting the database on Plant ID
     melted_database_transport = merged_transport_coal.melt(
-            id_vars = ['plant_id','coal_source_code','quantity'], 
-            var_name = 'FlowName', 
+            id_vars = ['plant_id','coal_source_code','quantity'],
+            var_name = 'FlowName',
             value_name = 'FlowAmount')
     melted_database_transport['coal_source_code']=melted_database_transport.apply(
             _transport_code,axis=1)
-    # Adding to new columns for the compartment (water) and 
-    # The source of the emissisons (mining). 
+    # Adding two new columns for the compartment (air) and
+    # the source of the emissions (transportation).
     melted_database_transport['Compartment'] = 'emission/air'
     melted_database_transport['Source'] = 'Transportation'
     melted_database_transport["ElementaryFlowPrimeContext"]="emission"
@@ -489,7 +500,7 @@ def wtd_mean(pdser, total_db):
             inplace=True
             )
     melted_database_transport["input"]=False
-    merged_coal_upstream = pd.concat([coal_mining_inventory_df, 
+    merged_coal_upstream = pd.concat([coal_mining_inventory_df,
                                       melted_database_transport],sort=False).reset_index(drop=True)
     merged_coal_upstream['FuelCategory']='COAL'
     merged_coal_upstream.rename(columns={
@@ -506,7 +517,14 @@ def wtd_mean(pdser, total_db):
     merged_coal_upstream["Source"]="netl"
     return merged_coal_upstream
 
+
+##############################################################################
+# MAIN
+##############################################################################
 if __name__=='__main__':
+    import electricitylci.model_config as config
+    config.model_specs = config.build_model_class()
+
     year=2020
     df = generate_upstream_coal(year)
     df.to_csv(output_dir+'/coal_emissions_{}.csv'.format(year))