diff --git a/scripts/us_epa/ghgrp/download.py b/scripts/us_epa/ghgrp/download.py index 57b4c02531..ab8e774814 100644 --- a/scripts/us_epa/ghgrp/download.py +++ b/scripts/us_epa/ghgrp/download.py @@ -15,119 +15,274 @@ # TODO(beets): Add tests import io +from absl import logging import os import ssl - -import pandas as pd +import re import requests +from datetime import datetime +import pandas as pd import zipfile +from retry import retry + +logging.set_verbosity(logging.INFO) -DOWNLOAD_URI = 'https://www.epa.gov/sites/default/files/2020-11/2019_data_summary_spreadsheets.zip' +# URL templates +download_url = 'https://www.epa.gov/system/files/other-files/{year}-10/{year_minus_1}_data_summary_spreadsheets.zip' +crosswalk_url = 'https://www.epa.gov/system/files/documents/{yr}-04/ghgrp_oris_power_plant_crosswalk_12_13_21.xlsx' + +# Constants YEAR_DATA_FILENAME = 'ghgp_data_{year}.xlsx' HEADER_ROW = 3 -CROSSWALK_URI = 'https://www.epa.gov/sites/default/files/2020-12/ghgrp_oris_power_plant_crosswalk_11_24_20.xlsx' CROSSWALK_COLS_TO_KEEP = [ 'GHGRP Facility ID', 'ORIS CODE', 'ORIS CODE 2', 'ORIS CODE 3', 'ORIS CODE 4', 'ORIS CODE 5' ] GHGRP_ID_COL = 'Facility Id' -_DIRECT_EMITTERS_SHEET = 'Direct Emitters' +_DIRECT_EMITTERS_SHEET = r"^Direct.*Emitters$" + SHEET_NAMES_TO_CSV_FILENAMES = { - _DIRECT_EMITTERS_SHEET: 'direct_emitters.csv', 'Onshore Oil & Gas Prod.': 'oil_and_gas.csv', 'Gathering & Boosting': 'gathering_and_boosting.csv', 'LDC - Direct Emissions': 'local_distribution.csv', 'SF6 from Elec. Equip.': 'elec_equip.csv', - # Needs schema: - # - 'Transmission Pipelines', - # The following sheets are skipped due to sparse data: - # - 'Suppliers', - # - 'CO2 Injection', - # - 'Geologic Sequestration of CO2', } +def get_csv_filename(sheet_name): + """ + Determines the CSV filename for a given sheet name. + Sheets matching the DIRECT_EMITTERS_PATTERN are saved as 'direct_emitters.csv'. + + Args: + sheet_name (str): Name of the Excel sheet to map to a CSV filename. + + Returns: + str: The corresponding CSV filename or None if no match is found. + """ + try: + if re.match(_DIRECT_EMITTERS_SHEET, sheet_name): + return 'direct_emitters.csv' + return SHEET_NAMES_TO_CSV_FILENAMES.get(sheet_name) + except Exception as e: + logging.fatal( + f"Error occured while mapping the sheet Direct Emitters: {e}") + + class Downloader: """ - The following must be called in order. Earlier steps can be skipped if it has successfully completed in a previous run. - - download_data - - extract_all_years - - save_all_crosswalks + Handles downloading, extracting, and processing data files. """ - def __init__(self, save_path): - self.years = list(range(2010, 2020)) + def __init__(self, save_path, url_year): + self.years = list(range(2010, url_year - 1)) self.current_year = None self.files = [] # list of (year, filename) of all extracted files self.save_path = save_path - def download_data(self): - """Downloads and unzips excel files from DOWNLOAD_URI.""" - print(f'Downloading data') - r = requests.get(DOWNLOAD_URI) - z = zipfile.ZipFile(io.BytesIO(r.content)) - z.extractall(self.save_path) + # Ensure the save directory exists + os.makedirs(self.save_path, exist_ok=True) + + def check_url(self, url): + """ + Checks if a given URL is accessible. + + Args: + url (str): The URL to check. + + Returns: + bool: True if the URL is accessible, False otherwise. + """ + + try: + response = requests.head(url) + response.raise_for_status() + logging.info(f"URL is valid: {url}") + return True + except requests.RequestException as e: + logging.warning(f"URL check failed: {url}. Error: {e}") + return False + + def generate_and_validate(self, template, **kwargs): + """ + Generates a URL using a template and validates its existence. + Args: + template (str): The URL template with placeholders. + **kwargs: Key-value pairs for placeholders in the template. + + Returns: + str: The validated URL. + + Raises: + ValueError: If the URL is not valid. + """ + try: + url = template.format(**kwargs) + if self.check_url(url): + logging.info(f"Valid URL found: {url}") + return url # Return the valid URL and stop further processing + logging.info(f"URL not valid: {url}") + return None + except Exception as e: + logging.fatal( + f"Error occured while generating and validating the url: {e}") + + @retry(tries=3, delay=2, backoff=2, exceptions=(requests.RequestException,)) + def download_data(self, year, year_minus_1): + """ + Download a file from the specified URL with retry logic. + Downloads and unzips Excel files from dynamically generated DOWNLOAD_URI. + Args: + year (int): The current year for the data. + year_minus_1 (int): The previous year for the data. + """ + uri = self.generate_and_validate(download_url, + year=year, + year_minus_1=year_minus_1) + logging.info(f'Downloading data from {uri}') + try: + r = requests.get(uri) + r.raise_for_status() # Raise an error for unsuccessful responses + z = zipfile.ZipFile(io.BytesIO(r.content)) + for file in z.namelist(): + # Skip directories + if not file.endswith('/'): + target_path = os.path.join(self.save_path, + os.path.basename(file)) + with z.open(file) as source, open(target_path, + 'wb') as target: + target.write(source.read()) + logging.info(f"Successfully downloaded data for year: {year}") + except Exception as e: + logging.fatal(f"Failed to download or extract data for {year}: {e}") def extract_all_years(self): - """Saves relevant sheets from each year's Excel file to a csv.""" - headers = {} - for sheet, _ in SHEET_NAMES_TO_CSV_FILENAMES.items(): - headers[sheet] = {} - for current_year in self.years: - print(f'Extracting data for {current_year}') - self.current_year = current_year - self._extract_data(headers) - for sheet, csv_name in SHEET_NAMES_TO_CSV_FILENAMES.items(): - headers_df = pd.DataFrame.from_dict(headers[sheet], orient='index') - headers_df.transpose().to_csv(os.path.join(self.save_path, - f'cols_{csv_name}'), - index=None) - return self.files + """ + Saves relevant sheets from each year's Excel file to a CSV. + Returns: + list: A list of tuples containing (year, filename) for extracted files. + """ + try: + headers = {} + for sheet, _ in SHEET_NAMES_TO_CSV_FILENAMES.items(): + headers[sheet] = {} + for current_year in self.years: + logging.info(f'Extracting data for {current_year}') + self.current_year = current_year + self._extract_data(headers) + for sheet, csv_name in SHEET_NAMES_TO_CSV_FILENAMES.items(): + headers_df = pd.DataFrame.from_dict(headers[sheet], + orient='index') + headers_df.transpose().to_csv(os.path.join( + self.save_path, f'cols_{csv_name}'), + index=None) + return self.files + except Exception as e: + logging.fatal( + f"Error occured while extracting the years from the file: {e}") def save_all_crosswalks(self, filepath): - """Builds individual year crosswalks, as well as a join crosswalk for all years.""" - print(f'Saving all ID crosswalks') - crosswalks = [] - for current_year in self.years: - crosswalks.append(self._gen_crosswalk()) - all_crosswalks_df = pd.concat(crosswalks, join='outer') - all_crosswalks_df = all_crosswalks_df.sort_values( - by=[GHGRP_ID_COL, 'FRS Id', 'ORIS CODE']) - all_crosswalks_df = all_crosswalks_df.drop_duplicates() - all_crosswalks_df.to_csv(filepath, header=True, index=None) - return all_crosswalks_df + """ + Builds individual year crosswalks, as well as a joint crosswalk for all years. + Args: + filepath (str): The path where the combined crosswalk CSV will be saved. + + Returns: + pd.DataFrame: A DataFrame containing all combined crosswalks. + """ + logging.info('Saving all ID crosswalks') + try: + crosswalks = [] + for current_year in self.years: + crosswalks.append(self._gen_crosswalk()) + all_crosswalks_df = pd.concat(crosswalks, join='outer') + all_crosswalks_df = all_crosswalks_df.sort_values( + by=[GHGRP_ID_COL, 'FRS Id', 'ORIS CODE']) + all_crosswalks_df = all_crosswalks_df.drop_duplicates() + all_crosswalks_df.to_csv(filepath, header=True, index=None) + return all_crosswalks_df + except Exception as e: + logging.fatal(f"Error occured while saving all cross walks: {e}") def _csv_path(self, csv_filename, year=None): + """ + Generates the full path for a CSV file. + + Args: + csv_filename (str): The base filename for the CSV. + year (int, optional): The year associated with the file. Defaults to the current year. + + Returns: + str: The full path to the CSV file. + """ if not year: year = self.current_year return os.path.join(self.save_path, f'{year}_{csv_filename}') def _extract_data(self, headers): - summary_filename = os.path.join( - self.save_path, YEAR_DATA_FILENAME.format(year=self.current_year)) - xl = pd.ExcelFile(summary_filename, engine='openpyxl') - for sheet in xl.sheet_names: - csv_filename = SHEET_NAMES_TO_CSV_FILENAMES.get(sheet, None) - if not csv_filename: - print(f'Skipping sheet: {sheet}') - continue - summary_file = xl.parse(sheet, header=HEADER_ROW, dtype=str) - csv_filename = self._csv_path(csv_filename) - summary_file.to_csv(csv_filename, index=None, header=True) - headers[sheet][self.current_year] = summary_file.columns - self.files.append((self.current_year, csv_filename)) + """ + Extracts relevant sheets from an Excel file for the current year. + + Args: + headers (dict): A dictionary to store header information for each sheet. + + """ + try: + summary_filename = os.path.join( + self.save_path, + YEAR_DATA_FILENAME.format(year=self.current_year)) + + xl = pd.ExcelFile(summary_filename, engine='openpyxl') + logging.info( + f"Available sheets in {summary_filename}: {xl.sheet_names}") + check_list = [] + for sheet in xl.sheet_names: + csv_filename = get_csv_filename(sheet) + check_list.append(csv_filename) + if not csv_filename: + logging.info(f'Skipping sheet: {sheet}') + continue + summary_file = xl.parse(sheet, header=HEADER_ROW, dtype=str) + csv_path = self._csv_path(csv_filename) + summary_file.to_csv(csv_path, index=None, header=True) + headers.setdefault(sheet, + {})[self.current_year] = summary_file.columns + self.files.append((self.current_year, csv_path)) + if "direct_emitters.csv" not in check_list: + logging.fatal( + f"'direct_emitters.csv' not found in the sheets for {self.current_year}. Aborting!" + ) + except Exception as e: + logging.fatal( + f"Error occured while processing the sheet names: {e}") def _gen_crosswalk(self): - # Per https://stackoverflow.com/a/56230607 + """ + Generates a crosswalk DataFrame for the current year. + + Returns: + pd.DataFrame: A DataFrame containing crosswalk data for the current year. + """ ssl._create_default_https_context = ssl._create_unverified_context + try: + oris_df = pd.read_excel(self.generate_and_validate( + crosswalk_url, yr=self.current_year), + 'ORIS Crosswalk', + header=0, + dtype=str, + usecols=CROSSWALK_COLS_TO_KEEP, + engine='openpyxl') + except Exception: + logging.warning(f"Using fallback CROSSWALK_URI for 2022") + oris_df = pd.read_excel(self.generate_and_validate(crosswalk_url, + yr=2022), + 'ORIS Crosswalk', + header=0, + dtype=str, + usecols=CROSSWALK_COLS_TO_KEEP, + engine='openpyxl') - oris_df = pd.read_excel(CROSSWALK_URI, - 'ORIS Crosswalk', - header=0, - dtype=str, - usecols=CROSSWALK_COLS_TO_KEEP, - engine='openpyxl') oris_df = oris_df.rename(columns={'GHGRP Facility ID': GHGRP_ID_COL}) all_facilities_df = pd.DataFrame() for sheet, csv_filename in SHEET_NAMES_TO_CSV_FILENAMES.items(): @@ -137,15 +292,28 @@ def _gen_crosswalk(self): df = pd.read_csv(csv_path, usecols=[GHGRP_ID_COL, 'FRS Id'], dtype=str) - all_facilities_df = all_facilities_df.append(df) + all_facilities_df = pd.concat([all_facilities_df, df], + ignore_index=True) all_facilities_df = all_facilities_df.join( oris_df.set_index(GHGRP_ID_COL), on=GHGRP_ID_COL, how='left') return all_facilities_df if __name__ == '__main__': - downloader = Downloader('tmp_data') - downloader.download_data() - downloader.extract_all_years() - downloader.save_all_crosswalks( - os.path.join(self.save_path, 'crosswalks.csv')) + try: + # Initialize downloader + url_year = datetime.now().year + downloader = Downloader('tmp_data', url_year) + + # Loop through years to download data + for year in range(2024, 2050): + if year <= datetime.now().year: + logging.info(f"Downloading data for year: {year}") + try: + downloader.download_data(year, year - 1) + except Exception as e: + logging.fatal( + f"Failed to download data for year {year}. Error: {e}") + + except Exception as e: + logging.fatal(f"An unexpected error occurred: {e}") diff --git a/scripts/us_epa/ghgrp/gen_data.sh b/scripts/us_epa/ghgrp/gen_data.sh deleted file mode 100755 index 36398bf492..0000000000 --- a/scripts/us_epa/ghgrp/gen_data.sh +++ /dev/null @@ -1,15 +0,0 @@ -#!/bin/bash -# Script used to generate TMCF/CSV/MCF for EPA GHGRP - -pushd ../../../ -python3 -m venv .env -source .env/bin/activate -pip3 install -r requirements_all.txt -q -popd - -# Generate schema to import_data/ -python3 -m gas -python3 -m sources - -# Download and process data, output CSV written to import_data/ -python3 -m process diff --git a/scripts/us_epa/ghgrp/manifest.json b/scripts/us_epa/ghgrp/manifest.json new file mode 100644 index 0000000000..a473363cfa --- /dev/null +++ b/scripts/us_epa/ghgrp/manifest.json @@ -0,0 +1,20 @@ +{ + "import_specifications": [ + { + "import_name": "EPA_GHGRP", + "curator_emails": ["support@datacommons.org"], + "provenance_url": "https://www.epa.gov/ghgreporting", + "provenance_description": "EPA emissions data reported as part of the Greenhouse Gas Reporting Program (GHGRP).", + "scripts": ["gas.py","sources.py","download.py","process.py"], + "import_inputs": [ + { + "template_mcf": "import_data/observations.tmcf", + "cleaned_csv": "import_data/all_data.csv" + } + ], + "cron_schedule": "0 10 1,15 * *", + "source_files": ["tmp_data/*"] + } + ] +} + diff --git a/scripts/us_epa/ghgrp/process.py b/scripts/us_epa/ghgrp/process.py index 6dbfa8faf0..6f37d7f468 100644 --- a/scripts/us_epa/ghgrp/process.py +++ b/scripts/us_epa/ghgrp/process.py @@ -15,8 +15,9 @@ import os import sys -import unittest import csv +from datetime import datetime +from absl import app, logging # Allows the following module imports to work when running as a script sys.path.append( @@ -25,6 +26,7 @@ from us_epa.ghgrp import download, gas, sources from us_epa.util import crosswalk as cw +# Define constants _FACILITY_ID = 'Facility Id' _DCID = 'dcid' _SV = 'sv' @@ -36,46 +38,91 @@ def process_data(data_filepaths, crosswalk, out_filepath): - print(f'Writing to {out_filepath}') - with open(out_filepath, 'w') as out_fp: - csv_writer = csv.DictWriter(out_fp, fieldnames=_OUT_FIELDNAMES) - csv_writer.writeheader() - all_processed_facilities = {} # map of year -> set(dcid) - for (year, filepath) in data_filepaths: - print(f'Processing {filepath}') - year_processed_facilities = all_processed_facilities.get( - year, set()) - with open(filepath, 'r') as fp: - for row in csv.DictReader(fp): - if not row[_FACILITY_ID]: - continue - dcid = crosswalk.get_dcid(row[_FACILITY_ID]) - assert dcid - if dcid in year_processed_facilities: - continue - for key, value in row.items(): - if not value: + """Processes multiple CSV data files and writes the output to a single CSV file. + + Args: + data_filepaths (list of tuples): A list containing tuples of (year, file path). + crosswalk (Crosswalk): An instance of the Crosswalk class for mapping facility IDs. + out_filepath (str): The output file path where processed data will be stored. + + Returns: + None + """ + + logging.info(f'Writing to {out_filepath}') + try: + with open(out_filepath, 'w') as out_fp: + csv_writer = csv.DictWriter(out_fp, fieldnames=_OUT_FIELDNAMES) + csv_writer.writeheader() + all_processed_facilities = {} # map of year -> set(dcid) + count = 0 + for (year, filepath) in data_filepaths: + logging.info(f'Processing {filepath}') + year_processed_facilities = all_processed_facilities.get( + year, set()) + with open(filepath, 'r') as fp: + for row in csv.DictReader(fp): + if not row[_FACILITY_ID]: continue - sv = gas.col_to_sv(key) - if not sv: - sv = sources.col_to_sv(key) - if not sv: + dcid = crosswalk.get_dcid(row[_FACILITY_ID]) + assert dcid + if dcid in year_processed_facilities: + continue + for key, value in row.items(): + if not value: continue - csv_writer.writerow({ - _DCID: f'dcid:{dcid}', - _SV: f'dcid:{sv}', - _YEAR: year, - _VALUE: value - }) - year_processed_facilities.add(dcid) - all_processed_facilities[year] = year_processed_facilities + sv = gas.col_to_sv(key) + if not sv: + sv = sources.col_to_sv(key) + if not sv: + continue + csv_writer.writerow({ + _DCID: f'dcid:{dcid}', + _SV: f'dcid:{sv}', + _YEAR: year, + _VALUE: value + }) + year_processed_facilities.add(dcid) + all_processed_facilities[year] = year_processed_facilities + count += 1 + logging.info(f"Number of files processed:{count}") + except Exception as e: + logging.fatal(f"Aborting processing due to the error: {e}") + + +def main(_): + try: + # Initialize downloader + url_year = datetime.now().year + downloader = download.Downloader('tmp_data', url_year) + + # Extract all years + logging.info("Starting extraction of all years.") + files = downloader.extract_all_years() + logging.info(f"Extraction complete. Files: {files}") + + # Generate and save crosswalk file + crosswalk_file = os.path.join(_SAVE_PATH, 'crosswalks.csv') + logging.info(f"Saving crosswalk file to: {crosswalk_file}") + downloader.save_all_crosswalks(crosswalk_file) + logging.info("Crosswalk file saved successfully.") + + # Initialize Crosswalk + logging.info( + f"Initializing Crosswalk object with file: {crosswalk_file}") + crosswalk = cw.Crosswalk(crosswalk_file) + + # Process data + output_file = os.path.join(_OUT_PATH, 'all_data.csv') + logging.info(f"Processing data and saving output to: {output_file}") + process_data(files, crosswalk, output_file) + logging.info("Data processing completed successfully.") + + except FileNotFoundError as e: + logging.fatal(f"File not found: {e}") + except Exception as e: + logging.fatal(f"An unexpected error occurred: {e}") if __name__ == '__main__': - downloader = download.Downloader(_SAVE_PATH) - downloader.download_data() - files = downloader.extract_all_years() - crosswalk_file = os.path.join(_SAVE_PATH, 'crosswalks.csv') - downloader.save_all_crosswalks(crosswalk_file) - crosswalk = cw.Crosswalk(crosswalk_file) - process_data(files, crosswalk, os.path.join(_OUT_PATH, 'all_data.csv')) + app.run(main) diff --git a/scripts/us_epa/ghgrp/process_test.py b/scripts/us_epa/ghgrp/process_test.py index 468058f68d..dab95e662e 100644 --- a/scripts/us_epa/ghgrp/process_test.py +++ b/scripts/us_epa/ghgrp/process_test.py @@ -42,17 +42,17 @@ def test_process_direct_emitters(self): fname = 'all_data.csv' got_filepath = os.path.join(tmp_dir, fname) process.process_data([ - ('2010', os.path.join(_RAW_DATA_DIR, - '2010_direct_emitters.csv')), - ('2012', os.path.join(_RAW_DATA_DIR, '2012_elec_equip.csv')), - ('2013', os.path.join(_RAW_DATA_DIR, '2013_oil_and_gas.csv')), - ('2016', + (2010, os.path.join(_RAW_DATA_DIR, '2010_direct_emitters.csv')), + (2011, os.path.join(_RAW_DATA_DIR, '2011_direct_emitters.csv')), + (2012, os.path.join(_RAW_DATA_DIR, '2012_elec_equip.csv')), + (2013, os.path.join(_RAW_DATA_DIR, + '2013_local_distribution.csv')), + (2014, os.path.join(_RAW_DATA_DIR, + '2014_local_distribution.csv')), + (2016, os.path.join(_RAW_DATA_DIR, '2016_gathering_and_boosting.csv')), - ('2017', - os.path.join(_RAW_DATA_DIR, '2017_local_distribution.csv')), - ('2019', os.path.join(_RAW_DATA_DIR, - '2019_direct_emitters.csv')), + (2016, os.path.join(_RAW_DATA_DIR, '2016_oil_and_gas.csv')) ], crosswalk, got_filepath) with open(got_filepath) as gotf: got = gotf.read() diff --git a/scripts/us_epa/ghgrp/test_data/expected/all_data.csv b/scripts/us_epa/ghgrp/test_data/expected/all_data.csv index 197b51d41d..e6d55a34e9 100644 --- a/scripts/us_epa/ghgrp/test_data/expected/all_data.csv +++ b/scripts/us_epa/ghgrp/test_data/expected/all_data.csv @@ -1,62 +1,121 @@ -dcid,sv,year,value -dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2010,82959.744 -dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2010,82875.9 -dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_Methane_NonBiogenic,2010,38.25 -dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2010,45.594 -dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2010,362.8 -dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_GreenhouseGas_ElectricityGeneration_NonBiogenic,2010,82596.944 -dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2010,25176.656 -dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2010,25150.9 -dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_Methane_NonBiogenic,2010,11.75 -dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2010,14.006 -dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2010,25176.656 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2010,37277 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2010,0 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_Methane_NonBiogenic,2010,37277 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_CarbonDioxide_Biogenic,2010,1.7 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2010,0 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_GreenhouseGas_MunicipalLandfills_NonBiogenic,2010,37277 -dcid:epaGhgrpFacilityId/1004063,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2010,17777.684 -dcid:epaGhgrpFacilityId/1004063,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2010,17759.6 -dcid:epaGhgrpFacilityId/1004063,dcid:Annual_Emissions_Methane_NonBiogenic,2010,8.25 -dcid:epaGhgrpFacilityId/1004063,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2010,9.834 -dcid:epaGhgrpFacilityId/1004063,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2010,17777.684 -dcid:epaGhgrpFacilityId/1010527,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2012,0 -dcid:epaGhgrpFacilityId/1009620,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2012,100753.2 -dcid:epaGhgrpFacilityId/1009620,dcid:Annual_Emissions_SulfurHexafluoride_NonBiogenic,2012,100753.2 -dcid:epaGhgrpFacilityId/1000355,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2013,163013.8 -dcid:epaGhgrpFacilityId/1000355,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2013,59015.6 -dcid:epaGhgrpFacilityId/1000355,dcid:Annual_Emissions_Methane_NonBiogenic,2013,103953.5 -dcid:epaGhgrpFacilityId/1000355,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2013,44.7 -dcid:epaGhgrpFacilityId/1008232,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2013,40908.05 -dcid:epaGhgrpFacilityId/1008232,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2013,297.3 -dcid:epaGhgrpFacilityId/1008232,dcid:Annual_Emissions_Methane_NonBiogenic,2013,40610.75 -dcid:epaGhgrpFacilityId/1012491,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,219181.668 -dcid:epaGhgrpFacilityId/1012491,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,174989.4 -dcid:epaGhgrpFacilityId/1012491,dcid:Annual_Emissions_Methane_NonBiogenic,2016,44038.5 -dcid:epaGhgrpFacilityId/1012491,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,153.768 -dcid:epaGhgrpFacilityId/1012814,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,51315.808 -dcid:epaGhgrpFacilityId/1012814,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,47713.4 -dcid:epaGhgrpFacilityId/1012814,dcid:Annual_Emissions_Methane_NonBiogenic,2016,3469.5 -dcid:epaGhgrpFacilityId/1012814,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,132.908 -dcid:epaGhgrpFacilityId/1001277,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2017,110810.65 -dcid:epaGhgrpFacilityId/1001277,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2017,133.4 -dcid:epaGhgrpFacilityId/1001277,dcid:Annual_Emissions_Methane_NonBiogenic,2017,110677.25 -dcid:epaGhgrpFacilityId/1001277,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2017,6392 -dcid:epaGhgrpFacilityId/1011115,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2017,33870.3 -dcid:epaGhgrpFacilityId/1011115,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2017,40.8 -dcid:epaGhgrpFacilityId/1011115,dcid:Annual_Emissions_Methane_NonBiogenic,2017,33829.5 -dcid:epaGhgrpFacilityId/1004377,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2019,518680.25 -dcid:epaGhgrpFacilityId/1004377,dcid:Annual_Emissions_Methane_NonBiogenic,2019,518680.25 -dcid:epaGhgrpFacilityId/1004377,dcid:Annual_Emissions_GreenhouseGas_MunicipalLandfills_NonBiogenic,2019,518680.25 -dcid:epaGhgrpFacilityId/1007606,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2019,916250.412 -dcid:epaGhgrpFacilityId/1007606,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2019,915046.8 -dcid:epaGhgrpFacilityId/1007606,dcid:Annual_Emissions_Methane_NonBiogenic,2019,445.5 -dcid:epaGhgrpFacilityId/1007606,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2019,758.112 -dcid:epaGhgrpFacilityId/1007606,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2019,2104.992 -dcid:epaGhgrpFacilityId/1007606,dcid:Annual_Emissions_GreenhouseGas_CementProduction_NonBiogenic,2019,914145.42 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2019,82134.75 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2019,0 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_Methane_NonBiogenic,2019,82134.75 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2019,0 -dcid:epaGhgrpFacilityId/1011696,dcid:Annual_Emissions_GreenhouseGas_MunicipalLandfills_NonBiogenic,2019,82134.75 +dcid,sv,year,value +dcid:epaGhgrpFacilityId/1004377,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2010,0 +dcid:epaGhgrpFacilityId/1004377,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2010,0 +dcid:epaGhgrpFacilityId/1004377,dcid:Annual_Emissions_GreenhouseGas_MunicipalLandfills_NonBiogenic,2010,0 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2010,82959.744 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2010,82875.9 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_Methane_NonBiogenic,2010,38.25 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2010,45.594 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2010,362.8 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_GreenhouseGas_ElectricityGeneration_NonBiogenic,2010,82596.944 +dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2010,25176.656 +dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2010,25150.9 +dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_Methane_NonBiogenic,2010,11.75 +dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2010,14.006 +dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2010,25176.656 +dcid:epaGhgrpFacilityId/1002885,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2010,38883.204 +dcid:epaGhgrpFacilityId/1002885,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2010,38843.2 +dcid:epaGhgrpFacilityId/1002885,dcid:Annual_Emissions_Methane_NonBiogenic,2010,18.25 +dcid:epaGhgrpFacilityId/1002885,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2010,21.754 +dcid:epaGhgrpFacilityId/1002885,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2010,38883.204 +dcid:epaGhgrpFacilityId/1002707,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2010,63884.36 +dcid:epaGhgrpFacilityId/1002707,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2010,63818.6 +dcid:epaGhgrpFacilityId/1002707,dcid:Annual_Emissions_Methane_NonBiogenic,2010,30 +dcid:epaGhgrpFacilityId/1002707,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2010,35.76 +dcid:epaGhgrpFacilityId/1002707,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2010,63884.36 +dcid:epaGhgrpFacilityId/1004377,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2011,194000 +dcid:epaGhgrpFacilityId/1004377,dcid:Annual_Emissions_Methane_NonBiogenic,2011,194000 +dcid:epaGhgrpFacilityId/1004377,dcid:Annual_Emissions_GreenhouseGas_MunicipalLandfills_NonBiogenic,2011,194000 +dcid:epaGhgrpFacilityId/1010040,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2011,390393.5 +dcid:epaGhgrpFacilityId/1010040,dcid:Annual_Emissions_Methane_NonBiogenic,2011,390393.5 +dcid:epaGhgrpFacilityId/1010040,dcid:Annual_Emissions_GreenhouseGas_UndergroundCoalMines_NonBiogenic,2011,390393.5 +dcid:epaGhgrpFacilityId/1010085,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2011,64664.5 +dcid:epaGhgrpFacilityId/1010085,dcid:Annual_Emissions_Methane_NonBiogenic,2011,64664.5 +dcid:epaGhgrpFacilityId/1010085,dcid:Annual_Emissions_GreenhouseGas_UndergroundCoalMines_NonBiogenic,2011,64664.5 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2011,100591.828 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2011,100489.9 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_Methane_NonBiogenic,2011,46.5 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2011,55.428 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2011,289.7 +dcid:epaGhgrpFacilityId/1000112,dcid:Annual_Emissions_GreenhouseGas_ElectricityGeneration_NonBiogenic,2011,100302.128 +dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2011,19389.57 +dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2011,19368.4 +dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_Methane_NonBiogenic,2011,9.25 +dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2011,11.92 +dcid:epaGhgrpFacilityId/1006394,dcid:Annual_Emissions_GreenhouseGas_StationaryCombustion_NonBiogenic,2011,19389.57 +dcid:epaGhgrpFacilityId/1003708,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2012,88826.52 +dcid:epaGhgrpFacilityId/1003708,dcid:Annual_Emissions_SulfurHexafluoride_NonBiogenic,2012,88826.52 +dcid:epaGhgrpFacilityId/1010640,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2012,7736.04 +dcid:epaGhgrpFacilityId/1010640,dcid:Annual_Emissions_SulfurHexafluoride_NonBiogenic,2012,7736.04 +dcid:epaGhgrpFacilityId/1010811,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2012,91298.04 +dcid:epaGhgrpFacilityId/1010811,dcid:Annual_Emissions_SulfurHexafluoride_NonBiogenic,2012,91298.04 +dcid:epaGhgrpFacilityId/1010812,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2012,14322.96 +dcid:epaGhgrpFacilityId/1010812,dcid:Annual_Emissions_SulfurHexafluoride_NonBiogenic,2012,14322.96 +dcid:epaGhgrpFacilityId/1009444,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2012,33518.28 +dcid:epaGhgrpFacilityId/1009444,dcid:Annual_Emissions_SulfurHexafluoride_NonBiogenic,2012,33518.28 +dcid:epaGhgrpFacilityId/1008026,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2013,75662.2 +dcid:epaGhgrpFacilityId/1008026,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2013,1236.7 +dcid:epaGhgrpFacilityId/1008026,dcid:Annual_Emissions_Methane_NonBiogenic,2013,74425.5 +dcid:epaGhgrpFacilityId/1004034,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2013,13353.6 +dcid:epaGhgrpFacilityId/1004034,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2013,16.1 +dcid:epaGhgrpFacilityId/1004034,dcid:Annual_Emissions_Methane_NonBiogenic,2013,13337.5 +dcid:epaGhgrpFacilityId/1004975,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2013,10821.8 +dcid:epaGhgrpFacilityId/1004975,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2013,12.8 +dcid:epaGhgrpFacilityId/1004975,dcid:Annual_Emissions_Methane_NonBiogenic,2013,10809 +dcid:epaGhgrpFacilityId/1006481,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2013,3111.7 +dcid:epaGhgrpFacilityId/1006481,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2013,3.7 +dcid:epaGhgrpFacilityId/1006481,dcid:Annual_Emissions_Methane_NonBiogenic,2013,3108 +dcid:epaGhgrpFacilityId/1007872,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2013,155513.8 +dcid:epaGhgrpFacilityId/1007872,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2013,177.3 +dcid:epaGhgrpFacilityId/1007872,dcid:Annual_Emissions_Methane_NonBiogenic,2013,155336.5 +dcid:epaGhgrpFacilityId/1008026,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2014,75801.6 +dcid:epaGhgrpFacilityId/1008026,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2014,1873.1 +dcid:epaGhgrpFacilityId/1008026,dcid:Annual_Emissions_Methane_NonBiogenic,2014,73928.5 +dcid:epaGhgrpFacilityId/1004034,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2014,13412.6 +dcid:epaGhgrpFacilityId/1004034,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2014,16.1 +dcid:epaGhgrpFacilityId/1004034,dcid:Annual_Emissions_Methane_NonBiogenic,2014,13396.5 +dcid:epaGhgrpFacilityId/1004975,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2014,10870.5 +dcid:epaGhgrpFacilityId/1004975,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2014,12.5 +dcid:epaGhgrpFacilityId/1004975,dcid:Annual_Emissions_Methane_NonBiogenic,2014,10858 +dcid:epaGhgrpFacilityId/1006481,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2014,2447.55 +dcid:epaGhgrpFacilityId/1006481,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2014,2.8 +dcid:epaGhgrpFacilityId/1006481,dcid:Annual_Emissions_Methane_NonBiogenic,2014,2444.75 +dcid:epaGhgrpFacilityId/1007872,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2014,155671.85 +dcid:epaGhgrpFacilityId/1007872,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2014,178.1 +dcid:epaGhgrpFacilityId/1007872,dcid:Annual_Emissions_Methane_NonBiogenic,2014,155493.75 +dcid:epaGhgrpFacilityId/1012507,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,44304.292 +dcid:epaGhgrpFacilityId/1012507,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,16724.9 +dcid:epaGhgrpFacilityId/1012507,dcid:Annual_Emissions_Methane_NonBiogenic,2016,27570.75 +dcid:epaGhgrpFacilityId/1012507,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,8.642 +dcid:epaGhgrpFacilityId/1012156,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,46921.114 +dcid:epaGhgrpFacilityId/1012156,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,35166.1 +dcid:epaGhgrpFacilityId/1012156,dcid:Annual_Emissions_Methane_NonBiogenic,2016,11734.75 +dcid:epaGhgrpFacilityId/1012156,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,20.264 +dcid:epaGhgrpFacilityId/1012155,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,78994.21 +dcid:epaGhgrpFacilityId/1012155,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,65490.2 +dcid:epaGhgrpFacilityId/1012155,dcid:Annual_Emissions_Methane_NonBiogenic,2016,13468.25 +dcid:epaGhgrpFacilityId/1012155,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,35.76 +dcid:epaGhgrpFacilityId/1012472,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,55733.472 +dcid:epaGhgrpFacilityId/1012472,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,51896.2 +dcid:epaGhgrpFacilityId/1012472,dcid:Annual_Emissions_Methane_NonBiogenic,2016,3810.75 +dcid:epaGhgrpFacilityId/1012472,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,26.522 +dcid:epaGhgrpFacilityId/1012466,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,177420.494 +dcid:epaGhgrpFacilityId/1012466,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,57531.8 +dcid:epaGhgrpFacilityId/1012466,dcid:Annual_Emissions_Methane_NonBiogenic,2016,119858 +dcid:epaGhgrpFacilityId/1012466,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,30.694 +dcid:epaGhgrpFacilityId/1000355,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,261382.84 +dcid:epaGhgrpFacilityId/1000355,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,154176.7 +dcid:epaGhgrpFacilityId/1000355,dcid:Annual_Emissions_Methane_NonBiogenic,2016,107115.25 +dcid:epaGhgrpFacilityId/1000355,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,90.89 +dcid:epaGhgrpFacilityId/1009263,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,3181.694 +dcid:epaGhgrpFacilityId/1009263,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,1730.8 +dcid:epaGhgrpFacilityId/1009263,dcid:Annual_Emissions_Methane_NonBiogenic,2016,1450 +dcid:epaGhgrpFacilityId/1009263,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,0.894 +dcid:epaGhgrpFacilityId/1009238,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,808767.966 +dcid:epaGhgrpFacilityId/1009238,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,600130.6 +dcid:epaGhgrpFacilityId/1009238,dcid:Annual_Emissions_Methane_NonBiogenic,2016,208416.25 +dcid:epaGhgrpFacilityId/1009238,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,221.116 +dcid:epaGhgrpFacilityId/1009283,dcid:Annual_Emissions_GreenhouseGas_NonBiogenic,2016,57168.136 +dcid:epaGhgrpFacilityId/1009283,dcid:Annual_Emissions_CarbonDioxide_NonBiogenic,2016,12931.4 +dcid:epaGhgrpFacilityId/1009283,dcid:Annual_Emissions_Methane_NonBiogenic,2016,44219.75 +dcid:epaGhgrpFacilityId/1009283,dcid:Annual_Emissions_NitrousOxide_NonBiogenic,2016,16.986 diff --git a/scripts/us_epa/ghgrp/test_data/input/2010_direct_emitters.csv b/scripts/us_epa/ghgrp/test_data/input/2010_direct_emitters.csv index 487e484c35..f4981d12ee 100644 --- a/scripts/us_epa/ghgrp/test_data/input/2010_direct_emitters.csv +++ b/scripts/us_epa/ghgrp/test_data/input/2010_direct_emitters.csv @@ -1,5 +1,6 @@ Facility Id,FRS Id,Facility Name,City,State,Zip Code,Address,County,Latitude,Longitude,Primary NAICS Code,Industry Type (subparts),Industry Type (sectors),Total reported direct emissions,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions ,HFC emissions,PFC emissions,SF6 emissions ,NF3 emissions,Other Fully Fluorinated GHG emissions,HFE emissions,Very Short-lived Compounds emissions,Other GHGs (metric tons CO2e),Biogenic CO2 emissions (metric tons),Stationary Combustion,Electricity Generation,Adipic Acid Production,Aluminum Production,Ammonia Manufacturing,Cement Production,Ferroalloy Production,Glass Production,HCFC–22 Production from HFC–23 Destruction,Hydrogen Production,Iron and Steel Production,Lead Production,Lime Production,Miscellaneous Use of Carbonates,Nitric Acid Production,Petrochemical Production,Petroleum Refining,Phosphoric Acid Production,Pulp and Paper Manufacturing,Silicon Carbide Production,Soda Ash Manufacturing,Titanium Dioxide Production,Zinc Production,Municipal Landfills,Is some CO2 collected on-site and used to manufacture other products and therefore not emitted from the affected manufacturing process unit(s)? (as reported under Subpart G or S),"Is some CO2 reported as emissions from the affected manufacturing process unit(s) under Subpart AA, G or P collected and transferred off-site or injected (as reported under Subpart PP)?",Does the facility employ continuous emissions monitoring? +1004377,110043803578,121 REGIONAL DISPOSAL FACILITY,MELISSA,TX,75454,3820 SAM RAYBURN HIGHWAY,COLLIN COUNTY,33.29857,-96.53586,562212,HH,Waste,0,0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0,N,N,N 1000112,110019827286,23rd and 3rd,BROOKLYN,NY,11232,730 3rd Avenue,Kings,40.663,-74,221112,"C,D",Power Plants,82959.744,82875.9,38.25,45.594,,,,,,,,,,362.8,82596.944,,,,,,,,,,,,,,,,,,,,,,,N,N,N 1006394,,29-6 #2 Central Delivery Point,Blanco,NM,87412,,Rio Arriba,36.7452,-107.4455,213112,C (Abbr),Petroleum and Natural Gas Systems,25176.656,25150.9,11.75,14.006,,,,,,,,,,25176.656,,,,,,,,,,,,,,,,,,,,,,,,N,N,N -1011696,110064007550,white oak landfill,waynesville,NC,28785,3898 fines creek rd,HAYWOOD COUNTY,35.661943,-82.996087,562212,"C,HH",Waste,37277,0,37277,,,,,,,,,,1.7,0,,,,,,,,,,,,,,,,,,,,,,,37277,N,N,N -1004063,110043803989,City of Charlottesville,Charlottesville,VA,22902,605 East Main St,CHARLOTTESVILLE CITY,38.0296,-78.47772,221210,"C,NN-LDC","Natural Gas and Natural Gas Liquids Suppliers,Other",17777.684,17759.6,8.25,9.834,,,,,,,,,,17777.684,,,,,,,,,,,,,,,,,,,,,,,,N,N,N \ No newline at end of file +1002885,,30-5 Central Delivery Point Compressor Station,Aztec,NM,87410,,Rio Arriba,36.8118,-107.4036,213112,C (Abbr),Petroleum and Natural Gas Systems,38883.204,38843.2,18.25,21.754,,,,,,,,,,38883.204,,,,,,,,,,,,,,,,,,,,,,,,N,N,N +1002707,,31-6 Central Delivery Point,BLOOMFIELD,NM,87413,,Rio Arriba,36.8363,-107.4199,213112,C (Abbr),Petroleum and Natural Gas Systems,63884.36,63818.6,30,35.76,,,,,,,,,,63884.36,,,,,,,,,,,,,,,,,,,,,,,,N,N,N diff --git a/scripts/us_epa/ghgrp/test_data/input/2010_local_distribution.csv b/scripts/us_epa/ghgrp/test_data/input/2010_local_distribution.csv deleted file mode 100644 index 937a47bd30..0000000000 --- a/scripts/us_epa/ghgrp/test_data/input/2010_local_distribution.csv +++ /dev/null @@ -1,2 +0,0 @@ -Facility Id,FRS Id,Facility Name,State where Emissions Occur,Reported City,Reported State,Reported Zip Code,Reported Address,Reported County,Reported Latitude,Reported Longitude,Primary NAICS Code,Industry Type (subparts),Total reported direct emissions from Local Distribution Companies,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions ,Does the facility employ continuous emissions monitoring? ,Unnamed: 18,Unnamed: 19,Unnamed: 20,Unnamed: 21,Unnamed: 22,Unnamed: 23,Unnamed: 24,Unnamed: 25,Unnamed: 26,Unnamed: 27,Unnamed: 28,Unnamed: 29,Unnamed: 30,Unnamed: 31,Unnamed: 32,Unnamed: 33,Unnamed: 34,Unnamed: 35,Unnamed: 36,Unnamed: 37,Unnamed: 38,Unnamed: 39,Unnamed: 40,Unnamed: 41,Unnamed: 42,Unnamed: 43,Unnamed: 44,Unnamed: 45,Unnamed: 46,Unnamed: 47,Unnamed: 48,Unnamed: 49,Unnamed: 50,Unnamed: 51,Unnamed: 52,Unnamed: 53,Unnamed: 54,Unnamed: 55,Unnamed: 56,Unnamed: 57,Unnamed: 58,Unnamed: 59 -1004063,110043803989,City of Charlottesville,VA,Charlottesville,VA,22902,605 East Main St,CHARLOTTESVILLE CITY,38.0296,-78.47772,221210,"C,NN-LDC,W-LDC",1440,2,1438,,N,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,, \ No newline at end of file diff --git a/scripts/us_epa/ghgrp/test_data/input/2019_direct_emitters.csv b/scripts/us_epa/ghgrp/test_data/input/2011_direct_emitters.csv similarity index 69% rename from scripts/us_epa/ghgrp/test_data/input/2019_direct_emitters.csv rename to scripts/us_epa/ghgrp/test_data/input/2011_direct_emitters.csv index 7579e32f6f..af1d17da4d 100644 --- a/scripts/us_epa/ghgrp/test_data/input/2019_direct_emitters.csv +++ b/scripts/us_epa/ghgrp/test_data/input/2011_direct_emitters.csv @@ -1,5 +1,6 @@ -Facility Id,FRS Id,Facility Name,City,State,Zip Code,Address,County,Latitude,Longitude,Primary NAICS Code,Industry Type (subparts),Industry Type (sectors),Total reported direct emissions,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions ,HFC emissions,PFC emissions,SF6 emissions ,NF3 emissions,Other Fully Fluorinated GHG emissions,HFE emissions,Very Short-lived Compounds emissions,Other GHGs (metric tons CO2e),Biogenic CO2 emissions (metric tons),Stationary Combustion,Electricity Generation,Adipic Acid Production,Aluminum Production,Ammonia Manufacturing,Cement Production,Electronics Manufacture,Ferroalloy Production,Fluorinated GHG Production,Glass Production,HCFC–22 Production from HFC–23 Destruction,Hydrogen Production,Iron and Steel Production,Lead Production,Lime Production,Magnesium Production,Miscellaneous Use of Carbonates,Nitric Acid Production,Petroleum and Natural Gas Systems – Offshore Production,Petroleum and Natural Gas Systems – Processing,Petroleum and Natural Gas Systems – Transmission/Compression,Petroleum and Natural Gas Systems – Underground Storage,Petroleum and Natural Gas Systems – LNG Storage,Petroleum and Natural Gas Systems – LNG Import/Export,Petrochemical Production,Petroleum Refining,Phosphoric Acid Production,Pulp and Paper Manufacturing,Silicon Carbide Production,Soda Ash Manufacturing,Titanium Dioxide Production,Underground Coal Mines,Zinc Production,Municipal Landfills,Industrial Wastewater Treatment,Manufacture of Electric Transmission and Distribution Equipment,Industrial Waste Landfills,Is some CO2 collected on-site and used to manufacture other products and therefore not emitted from the affected manufacturing process unit(s)? (as reported under Subpart G or S),"Is some CO2 reported as emissions from the affected manufacturing process unit(s) under Subpart AA, G or P collected and transferred off-site or injected (as reported under Subpart PP)?",Does the facility employ continuous emissions monitoring? ,Unnamed: 66 -1004377,110043803578,121 REGIONAL DISPOSAL FACILITY,MELISSA,TX,75454,3820 SAM RAYBURN HIGHWAY,COLLIN COUNTY,33.29857,-96.53586,562212,HH,Waste,518680.25,,518680.25,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,518680.25,,,,N,N,N, -1007606,110000597729,ASH GROVE CEMENT-FOREMAN,Foreman,AR,71836,4343 HWY 108,LITTLE RIVER COUNTY,33.6936,-94.4166,327310,"C,H",Minerals,916250.412,915046.8,445.5,758.112,,,,,,,,,,2104.992,,,,,914145.42,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,N,N,N, -1011696,110064007550,white oak landfill,waynesville,NC,28785,3898 fines creek rd,HAYWOOD COUNTY,35.661943,-82.996087,562212,"C,HH",Waste,82134.75,0,82134.75,,,,,,,,,,,0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,82134.75,,,,N,N,N, -,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,, \ No newline at end of file +Facility Id,FRS Id,Facility Name,City,State,Zip Code,Address,County,Latitude,Longitude,Primary NAICS Code,Industry Type (subparts),Industry Type (sectors),Total reported direct emissions,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions ,HFC emissions,PFC emissions,SF6 emissions ,NF3 emissions,Other Fully Fluorinated GHG emissions,HFE emissions,Very Short-lived Compounds emissions,Other GHGs (metric tons CO2e),Biogenic CO2 emissions (metric tons),Stationary Combustion,Electricity Generation,Adipic Acid Production,Aluminum Production,Ammonia Manufacturing,Cement Production,Electronics Manufacture,Ferroalloy Production,Fluorinated GHG Production,Glass Production,HCFC–22 Production from HFC–23 Destruction,Hydrogen Production,Iron and Steel Production,Lead Production,Lime Production,Magnesium Production,Miscellaneous Use of Carbonates,Nitric Acid Production,Petroleum and Natural Gas Systems – Offshore Production,Petroleum and Natural Gas Systems – Processing,Petroleum and Natural Gas Systems – Transmission/Compression,Petroleum and Natural Gas Systems – Underground Storage,Petroleum and Natural Gas Systems – LNG Storage,Petroleum and Natural Gas Systems – LNG Import/Export,Petrochemical Production,Petroleum Refining,Phosphoric Acid Production,Pulp and Paper Manufacturing,Silicon Carbide Production,Soda Ash Manufacturing,Titanium Dioxide Production,Underground Coal Mines,Zinc Production,Municipal Landfills,Industrial Wastewater Treatment,Manufacture of Electric Transmission and Distribution Equipment,Industrial Waste Landfills,Is some CO2 collected on-site and used to manufacture other products and therefore not emitted from the affected manufacturing process unit(s)? (as reported under Subpart G or S),"Is some CO2 reported as emissions from the affected manufacturing process unit(s) under Subpart AA, G or P collected and transferred off-site or injected (as reported under Subpart PP)?",Does the facility employ continuous emissions monitoring? +1004377,110043803578,121 REGIONAL DISPOSAL FACILITY,MELISSA,TX,75454,3820 SAM RAYBURN HIGHWAY,COLLIN COUNTY,33.29857,-96.53586,562212,HH,Waste,194000,,194000,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,194000,,,,N,N,N +1010040,110070082056,15-18565/15-18662,Hazard,KY,40701,4200 S. Hwy 15,PERRY COUNTY,37.219099,-83.156046,212112,FF,Other,390393.5,,390393.5,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,390393.5,,,,,,N,N,N +1010085,110055519176,15-19015,Hazard,KY,41701,1845 S. KY HWY 15,PERRY,37.236617,-83.18126,212112,FF,Other,64664.5,,64664.5,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,64664.5,,,,,,N,N,N +1000112,110019827286,23rd and 3rd,BROOKLYN,NY,11232,730 3rd Avenue,Kings,40.663,-74,221112,"C,D",Power Plants,100591.828,100489.9,46.5,55.428,,,,,,,,,,289.7,100302.128,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,N,N,N +1006394,,29-6 #2 Central Delivery Point,Blanco,NM,87412,,Rio Arriba,36.7452,-107.4455,213112,C,Petroleum and Natural Gas Systems,19389.57,19368.4,9.25,11.92,,,,,,,,,,19389.57,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,N,N,N diff --git a/scripts/us_epa/ghgrp/test_data/input/2012_elec_equip.csv b/scripts/us_epa/ghgrp/test_data/input/2012_elec_equip.csv index 3020e4ab8f..cf378bd8ab 100644 --- a/scripts/us_epa/ghgrp/test_data/input/2012_elec_equip.csv +++ b/scripts/us_epa/ghgrp/test_data/input/2012_elec_equip.csv @@ -1,3 +1,6 @@ -Facility Id,FRS Id,Facility Name,Reported City,Reported State,Reported Zip Code,Reported Address,Reported County,Reported Latitude,Reported Longitude,Primary NAICS Code,Industry Type (subparts),Total reported direct emissions from Electrical Equipment Use,SF6 emissions ,Does the facility employ continuous emissions monitoring? ,Unnamed: 15,Unnamed: 16,Unnamed: 17,Unnamed: 18,Unnamed: 19,Unnamed: 20,Unnamed: 21,Unnamed: 22,Unnamed: 23,Unnamed: 24,Unnamed: 25,Unnamed: 26,Unnamed: 27,Unnamed: 28,Unnamed: 29,Unnamed: 30,Unnamed: 31,Unnamed: 32,Unnamed: 33,Unnamed: 34,Unnamed: 35,Unnamed: 36,Unnamed: 37,Unnamed: 38,Unnamed: 39,Unnamed: 40,Unnamed: 41,Unnamed: 42,Unnamed: 43,Unnamed: 44,Unnamed: 45,Unnamed: 46,Unnamed: 47,Unnamed: 48,Unnamed: 49,Unnamed: 50,Unnamed: 51,Unnamed: 52,Unnamed: 53,Unnamed: 54,Unnamed: 55,Unnamed: 56,Unnamed: 57,Unnamed: 58,Unnamed: 59 -1010527,110049258772,ITC Great Plains,Novi,MI,48377,27175 Energy Way,OAKLAND COUNTY,42.4926,-83.44298,221121,DD,0,,N,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,, -1009620,110017609346,"Westar Energy, Inc.",Topeka,KS,66612,818 S Kansas Ave,SHAWNEE COUNTY,39.04854,-95.67468,221121,DD,100753.2,100753.2,N,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,, \ No newline at end of file +Facility Id,FRS Id,Facility Name,Reported City,Reported State,Reported Zip Code,Reported Address,Reported County,Reported Latitude,Reported Longitude,Primary NAICS Code,Industry Type (subparts),Total reported direct emissions from Electrical Equipment Use,SF6 emissions ,Does the facility employ continuous emissions monitoring? +1003708,110000591930,AEP Corporate SF6 Emissions,Columbus,OH,43215,1 Riverside Plaza,WASHINGTON,39.588493,-81.682523,221112,DD,88826.52,88826.52,N +1010640,110006650212,"ALLETE, Inc. Transmission and Distribution System",Duluth,MN,55802,30 West Superior Street,ST. LOUIS COUNTY,46.78608,-92.09926,221122,DD,7736.04,7736.04,N +1010811,110010724216,Ameren Illinois Electric,Peoria,IL,61602,300 Liberty Street,PEORIA COUNTY,40.69048,-89.59244,221122,DD,91298.04,91298.04,N +1010812,110011771948,Ameren Missouri Electric,St. Louis,MO,63103,1901 Chouteau Avenue,SAINT LOUIS CITY,38.620785,-90.211635,221122,DD,14322.96,14322.96,N +1009444,110043470721,American Transmission Company,Waukesha,WI,53188,W234 N2000 Ridgeview Parkway Court,WAUKESHA,43.060408,-88.225005,221121,DD,33518.28,33518.28,N diff --git a/scripts/us_epa/ghgrp/test_data/input/2013_local_distribution.csv b/scripts/us_epa/ghgrp/test_data/input/2013_local_distribution.csv new file mode 100644 index 0000000000..ea5c9cf53d --- /dev/null +++ b/scripts/us_epa/ghgrp/test_data/input/2013_local_distribution.csv @@ -0,0 +1,6 @@ +Facility Id,FRS Id,Facility Name,State where Emissions Occur,Reported City,Reported State,Reported Zip Code,Reported Address,Reported County,Reported Latitude,Reported Longitude,Primary NAICS Code,Industry Type (subparts),Total reported direct emissions from Local Distribution Companies,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions ,Does the facility employ continuous emissions monitoring? +1008026,110010724216,Ameren Illinois,IL,Peoria,IL,61602,300 Liberty Street,PEORIA COUNTY,40.69048,-89.59244,221210,"NN-LDC,W-LDC",75662.2,1236.7,74425.5,,N +1004034,110011771948,Ameren Missouri,MO,St. Louis,MO,63103,1901 Chouteau Avenue,ST. LOUIS CITY,38.620785,-90.211635,221210,"NN-LDC,W-LDC",13353.6,16.1,13337.5,,N +1004975,110025098249,Arkansas Oklahoma Gas Corp (AR),AR,Fort Smith,AR,72903,5030 South S Street,SEBASTIAN COUNTY,35.36353,-94.37573,221210,"NN-LDC,W-LDC",10821.8,12.8,10809,,N +1006481,110025080267,Arkansas Oklahoma Gas Corp (OK),OK,Fort Smith,AR,72903,5030 South S Street,SEBASTIAN COUNTY,35.36353,-94.37573,221210,"NN-LDC,W-LDC",3111.7,3.7,3108,,N +1007872,110043799654,Atlanta Gas Light Company,GA,Atlanta,GA,30309,Ten Peachtree Place,FULTON COUNTY,33.780708,-84.387782,221210,"NN-LDC,W-LDC",155513.8,177.3,155336.5,,N diff --git a/scripts/us_epa/ghgrp/test_data/input/2013_oil_and_gas.csv b/scripts/us_epa/ghgrp/test_data/input/2013_oil_and_gas.csv deleted file mode 100644 index d2bdcbee32..0000000000 --- a/scripts/us_epa/ghgrp/test_data/input/2013_oil_and_gas.csv +++ /dev/null @@ -1,3 +0,0 @@ -Facility Id,FRS Id,Facility Name,Basin,Reported City,Reported State,Reported Zip Code,Reported Address,Reported County,Reported Latitude,Reported Longitude,Primary NAICS Code,Industry Type (subparts),Total reported emissions from Onshore Oil & Gas Production ,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions ,Does the facility employ continuous emissions monitoring? ,Unnamed: 18,Unnamed: 19,Unnamed: 20,Unnamed: 21,Unnamed: 22,Unnamed: 23,Unnamed: 24,Unnamed: 25,Unnamed: 26,Unnamed: 27,Unnamed: 28,Unnamed: 29,Unnamed: 30,Unnamed: 31,Unnamed: 32,Unnamed: 33,Unnamed: 34,Unnamed: 35,Unnamed: 36,Unnamed: 37,Unnamed: 38,Unnamed: 39,Unnamed: 40,Unnamed: 41,Unnamed: 42,Unnamed: 43,Unnamed: 44,Unnamed: 45,Unnamed: 46,Unnamed: 47,Unnamed: 48,Unnamed: 49,Unnamed: 50,Unnamed: 51,Unnamed: 52,Unnamed: 53,Unnamed: 54,Unnamed: 55,Unnamed: 56,Unnamed: 57,Unnamed: 58,Unnamed: 59 -1000355,110002972506,#540 BONANZA CREEK ENERGY - DENVER BASIN,540 - Denver Basin,Denver,CO,80202,"410 17th Street, Suite 1500",DENVER COUNTY,39.74431,-104.98858,211111,W-ONSH,163013.8,59015.6,103953.5,44.7,N,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,, -1008232,110022679485,YPC 535 Green River Basin,535 - Green River Basin,Artesia,NM,88210,105 South Fourth Street,EDDY COUNTY,32.84142,-104.40106,211111,W-ONSH,40908.05,297.3,40610.75,,N,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,, \ No newline at end of file diff --git a/scripts/us_epa/ghgrp/test_data/input/2014_local_distribution.csv b/scripts/us_epa/ghgrp/test_data/input/2014_local_distribution.csv new file mode 100644 index 0000000000..d7fcdeadbc --- /dev/null +++ b/scripts/us_epa/ghgrp/test_data/input/2014_local_distribution.csv @@ -0,0 +1,6 @@ +Facility Id,FRS Id,Facility Name,State where Emissions Occur,Reported City,Reported State,Reported Zip Code,Reported Address,Reported County,Reported Latitude,Reported Longitude,Primary NAICS Code,Industry Type (subparts),Total reported direct emissions from Local Distribution Companies,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions ,Does the facility employ continuous emissions monitoring? +1008026,110010724216,Ameren Illinois,IL,Peoria,IL,61602,300 Liberty Street,PEORIA COUNTY,40.69048,-89.59244,221210,"NN-LDC,W-LDC",75801.6,1873.1,73928.5,,N +1004034,110011771948,Ameren Missouri,MO,St. Louis,MO,63103,1901 Chouteau Avenue,ST. LOUIS CITY,38.620785,-90.211635,221210,"NN-LDC,W-LDC",13412.6,16.1,13396.5,,N +1004975,110025098249,Arkansas Oklahoma Gas Corp (AR),AR,Fort Smith,AR,72903,5030 South S Street,SEBASTIAN COUNTY,35.36353,-94.37573,221210,"NN-LDC,W-LDC",10870.5,12.5,10858,,N +1006481,110025080267,Arkansas Oklahoma Gas Corp (OK),OK,Fort Smith,AR,72903,5030 South S Street,SEBASTIAN COUNTY,35.36353,-94.37573,221210,"NN-LDC,W-LDC",2447.55,2.8,2444.75,,N +1007872,110043799654,Atlanta Gas Light Company,GA,Atlanta,GA,30309,Ten Peachtree Place,FULTON COUNTY,33.780708,-84.387782,221210,"NN-LDC,W-LDC",155671.85,178.1,155493.75,,N diff --git a/scripts/us_epa/ghgrp/test_data/input/2016_gathering_and_boosting.csv b/scripts/us_epa/ghgrp/test_data/input/2016_gathering_and_boosting.csv index 6e36114a47..47833cb4e7 100644 --- a/scripts/us_epa/ghgrp/test_data/input/2016_gathering_and_boosting.csv +++ b/scripts/us_epa/ghgrp/test_data/input/2016_gathering_and_boosting.csv @@ -1,3 +1,6 @@ -Facility Id,FRS Id,Facility Name,Basin,Reported City,Reported State,Reported Zip Code,Reported Address,Reported County,Reported Latitude,Reported Longitude,Primary NAICS Code,Industry Type (subparts),Total reported emissions from Gathering & Boosting,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions ,Unnamed: 17,Unnamed: 18,Unnamed: 19,Unnamed: 20,Unnamed: 21,Unnamed: 22,Unnamed: 23,Unnamed: 24,Unnamed: 25,Unnamed: 26,Unnamed: 27,Unnamed: 28,Unnamed: 29,Unnamed: 30,Unnamed: 31,Unnamed: 32,Unnamed: 33,Unnamed: 34,Unnamed: 35,Unnamed: 36,Unnamed: 37,Unnamed: 38,Unnamed: 39,Unnamed: 40,Unnamed: 41,Unnamed: 42,Unnamed: 43,Unnamed: 44,Unnamed: 45,Unnamed: 46,Unnamed: 47,Unnamed: 48,Unnamed: 49,Unnamed: 50,Unnamed: 51,Unnamed: 52,Unnamed: 53,Unnamed: 54,Unnamed: 55,Unnamed: 56,Unnamed: 57,Unnamed: 58 -1012491,110070082322,EGG 350 South Oklahoma Folded Belt GB,350 - South Oklahoma Folded Belt,Oklahoma City,OK,73100,"499 W. Sheridan, Suite 1500",OKLAHOMA COUNTY,35.46646,-97.52124,486210,W-GB,219181.668,174989.4,44038.5,153.768,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,, -1012814,110070082511,TOMPC Chautauqua #355-G&B,355 - Chautauqua Platform,Bridgeport,TX,76426,1209 County Road 1304,WISE COUNTY,33.22345,-97.7372,211111,W-GB,51315.808,47713.4,3469.5,132.908,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,, \ No newline at end of file +Facility Id,FRS Id,Facility Name,Basin,Reported City,Reported State,Reported Zip Code,Reported Address,Reported County,Reported Latitude,Reported Longitude,Primary NAICS Code,Industry Type (subparts),Total reported emissions from Gathering & Boosting,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions +1012507,110070082329,220 Gulf Coast Basin,"220 - Gulf Coast Basin (LA, TX)",Houston,TX,77002,"811 Louisiana, Suite 2100",HARRIS COUNTY,29.75993,-95.366413,211111,W-GB,44304.292,16724.9,27570.75,8.642 +1012156,110071161819,260 - East Texas Basin Gathering/Boosting,260 - East Texas Basin,Houston,TX,77079,737 Eldridge Parkway,HARRIS COUNTY,29.77455,-95.61949,211111,W-GB,46921.114,35166.1,11734.75,20.264 +1012155,110071161818,345 - Arkoma Basin Gathering/Boosting,345 - Arkoma Basin,Houston,TX,77079,737 Eldridge Parkway,HARRIS COUNTY,29.77455,-95.61949,211111,W-GB,78994.21,65490.2,13468.25,35.76 +1012472,110070082329,345 Arkoma Basin,345 - Arkoma Basin,Houston,TX,77002,"811 Louisiana, Suite 2100",HARRIS COUNTY,29.75993,-95.366413,211111,W-GB,55733.472,51896.2,3810.75,26.522 +1012466,110070082329,350 South Oklahoma Folded Belt,350 - South Oklahoma Folded Belt,Houston,TX,77002,"811 Louisiana, Suite 2100",HARRIS COUNTY,29.75993,-95.366413,211111,W-GB,177420.494,57531.8,119858,30.694 diff --git a/scripts/us_epa/ghgrp/test_data/input/2016_oil_and_gas.csv b/scripts/us_epa/ghgrp/test_data/input/2016_oil_and_gas.csv new file mode 100644 index 0000000000..dcea223a01 --- /dev/null +++ b/scripts/us_epa/ghgrp/test_data/input/2016_oil_and_gas.csv @@ -0,0 +1,5 @@ +Facility Id,FRS Id,Facility Name,Basin,Reported City,Reported State,Reported Zip Code,Reported Address,Reported County,Reported Latitude,Reported Longitude,Primary NAICS Code,Industry Type (subparts),Total reported emissions from Onshore Oil & Gas Production ,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions ,Does the facility employ continuous emissions monitoring? +1000355,,#540 BONANZA CREEK ENERGY - DENVER BASIN,540 - Denver Basin,Denver,CO,80202,"410 17th Street, Suite 1500",,39.74431,-104.98858,211111,W-ONSH,261382.84,154176.7,107115.25,90.89,N +1009263,110071162236,220 Gulf Coast,"220 - Gulf Coast Basin (LA, TX)",Oklahoma City,OK,73114,701 Cedar Lake Blvd,OKLAHOMA COUNTY,35.56719,-97.49827,211111,W-ONSH,3181.694,1730.8,1450,0.894,N +1009238,,220 Gulf Coast Basin DEC,"220 - Gulf Coast Basin (LA, TX)",Oklahoma City,OK,73102,333 West Sheridan Ave,,35.466697,-97.51453,211111,W-ONSH,808767.966,600130.6,208416.25,221.116,N +1009283,,230 Arkla Basin QEP Energy Company,230 - Arkla Basin,Denver,CO,80265,1050 17th Street Unit 800,,39.7480769,-104.994564,211111,W-ONSH,57168.136,12931.4,44219.75,16.986,N diff --git a/scripts/us_epa/ghgrp/test_data/input/2017_local_distribution.csv b/scripts/us_epa/ghgrp/test_data/input/2017_local_distribution.csv deleted file mode 100644 index 254daa54ac..0000000000 --- a/scripts/us_epa/ghgrp/test_data/input/2017_local_distribution.csv +++ /dev/null @@ -1,3 +0,0 @@ -Facility Id,FRS Id,Facility Name,State where Emissions Occur,Reported City,Reported State,Reported Zip Code,Reported Address,Reported County,Reported Latitude,Reported Longitude,Primary NAICS Code,Industry Type (subparts),Total reported direct emissions from Local Distribution Companies,CO2 emissions (non-biogenic) ,Methane (CH4) emissions ,Nitrous Oxide (N2O) emissions ,Does the facility employ continuous emissions monitoring? ,Unnamed: 18,Unnamed: 19,Unnamed: 20,Unnamed: 21,Unnamed: 22,Unnamed: 23,Unnamed: 24,Unnamed: 25,Unnamed: 26,Unnamed: 27,Unnamed: 28,Unnamed: 29,Unnamed: 30,Unnamed: 31,Unnamed: 32,Unnamed: 33,Unnamed: 34,Unnamed: 35,Unnamed: 36,Unnamed: 37,Unnamed: 38,Unnamed: 39,Unnamed: 40,Unnamed: 41,Unnamed: 42,Unnamed: 43,Unnamed: 44,Unnamed: 45,Unnamed: 46,Unnamed: 47,Unnamed: 48,Unnamed: 49,Unnamed: 50,Unnamed: 51,Unnamed: 52,Unnamed: 53,Unnamed: 54,Unnamed: 55,Unnamed: 56,Unnamed: 57,Unnamed: 58,Unnamed: 59 -1001277,110043952283,NSTAR Gas Company,MA,Westwood,MA,02090,1 NSTAR Way,NORFOLK COUNTY,42.20446,-71.15937,221210,"NN-LDC,W-LDC",110810.65,133.4,110677.25,6392,N,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,, -1011115,110010642073,"West Texas Gas, Inc.",TX,Midland,TX,79701,211 North Colorado,MIDLAND COUNTY,31.99906,-102.07688,221210,"NN-LDC,W-LDC",33870.3,40.8,33829.5,,N,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,, \ No newline at end of file diff --git a/scripts/us_epa/ghgrp/test_data/input/crosswalks.csv b/scripts/us_epa/ghgrp/test_data/input/crosswalks.csv index 1f8762cf57..cae802a43d 100644 --- a/scripts/us_epa/ghgrp/test_data/input/crosswalks.csv +++ b/scripts/us_epa/ghgrp/test_data/input/crosswalks.csv @@ -1,13 +1,10 @@ Facility Id,FRS Id,ORIS CODE,ORIS CODE 2,ORIS CODE 3,ORIS CODE 4,ORIS CODE 5 -1000112,110019827286,7910,,,, -1000355,110002972506,,,,, -1001277,110043952283,,,,, -1004377,110043803578,,,,, -1007606,110000597729,,,,, -1009620,110017609346,,,,, -1010527,110049258772,,,,, -1011115,110010642073,,,,, -1011696,110064007550,,,,, -1011696,110064007550,,,,, -1012491,110070082322,,,,, -1012814,110070082511,,,,, \ No newline at end of file +1000011,110000807379,,,,, +1000054,110071160313,,,,, +1000091,110071159598,581,,,, +1000205,110071161799,,,,, +1000326,110043797585,,,,, +1000355,,,,,, +1000388,110071160900,,,,, +1000435,,,,,, +1000507,110035420719,50865,,,,