"""Metadata and operational constants."""
from typing import Any, Dict
from pudl.metadata.constants import CONTRIBUTORS, KEYWORDS, LICENSES
from pudl.metadata.enums import EPACEMS_STATES
[docs]SOURCES: Dict[str, Any] = {
"censusdp1tract": {
"title": "Census DP1",
"path": "https://www.census.gov/geographies/mapping-files/2010/geo/tiger-data.html",
"description": (
"US Census Demographic Profile 1 (DP1) County and Tract "
"GeoDatabase."
),
"working_partitions": {}, # Census DP1 is monolithic.
"keywords": sorted(set(
[
"censusdp1tract",
"census",
]
)),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"eia860": {
"title": "EIA Form 860",
"path": "https://www.eia.gov/electricity/data/eia860",
"description": (
"US Energy Information Administration (EIA) Form 860 data for "
"electric power plants with 1 megawatt or greater combined nameplate "
"capacity."
),
"field_namespace": "eia",
"contributors": [
CONTRIBUTORS["catalyst-cooperative"],
CONTRIBUTORS["zane-selvans"],
CONTRIBUTORS["christina-gosnell"],
CONTRIBUTORS["steven-winter"],
CONTRIBUTORS["alana-wilson"],
],
"working_partitions": {
"years": sorted(set(range(2001, 2021))),
},
"keywords": sorted(set(
[
"eia860",
"form 860",
"ownership",
"annual",
"yearly",
]
+ KEYWORDS["eia"]
+ KEYWORDS["us_govt"]
+ KEYWORDS["electricity"]
+ KEYWORDS["fuels"]
+ KEYWORDS["plants"]
+ KEYWORDS["environment"]
)),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"eia860m": {
"title": "EIA Form 860m",
"path": "https://www.eia.gov/electricity/data/eia860m",
"description": (
"US Energy Information Administration (EIA) Form 860 M data for "
"electric power plants with 1 megawatt or greater combined nameplate "
"capacity. Preliminary Monthly Electric Generator Inventory (based on "
"Form EIA-860M as a supplement to Form EIA-860)"
),
"field_namespace": "eia",
"contributors": [],
"working_partitions": {
"year_month": "2021-12",
},
"keywords": sorted(set(
[
"eia860m",
"form 860m",
"monthly",
]
+ KEYWORDS["eia"]
+ KEYWORDS["us_govt"]
+ KEYWORDS["electricity"]
+ KEYWORDS["fuels"]
+ KEYWORDS["plants"]
+ KEYWORDS["environment"]
)),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"eia861": {
"title": "EIA Form 861: Annual Electric Power Industry Report",
"path": "https://www.eia.gov/electricity/data/eia861",
"description": (
"EIA Form 861 Annual Electric Power Industry Report, detailed "
"data files."
),
"field_namespace": "eia",
"working_partitions": {
"years": sorted(set(range(2001, 2021))),
},
"contributors": [],
"keywords": sorted(set(
[
"eia861",
"form 861",
"balancing authority",
"advanced metering infrastructure",
"customer class",
"green pricing",
"energy efficiency",
"demand side management",
"demand response",
"net metering",
"business model",
"service territory",
"annual",
"yearly",
]
+ KEYWORDS["eia"]
+ KEYWORDS["us_govt"]
+ KEYWORDS["electricity"]
)),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"eia923": {
"title": "EIA Form 923",
"path": "https://www.eia.gov/electricity/data/eia923",
"description": (
"The EIA Form 923 collects detailed monthly and annual electric "
"power data on electricity generation, fuel consumption, fossil fuel "
"stocks, and receipts at the power plant and prime mover level."
),
"field_namespace": "eia",
"working_partitions": {
"years": sorted(set(range(2001, 2021))),
},
"contributors": [
CONTRIBUTORS["catalyst-cooperative"],
CONTRIBUTORS["zane-selvans"],
CONTRIBUTORS["christina-gosnell"],
CONTRIBUTORS["steven-winter"],
CONTRIBUTORS["katherine-lamb"],
],
"keywords": sorted(set(
[
"eia923",
"form 923",
"monthly",
]
+ KEYWORDS["eia"]
+ KEYWORDS["us_govt"]
+ KEYWORDS["electricity"]
+ KEYWORDS["fuels"]
+ KEYWORDS["plants"]
+ KEYWORDS["environment"]
)),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"eiawater": {
"title": "EIA Thermoelectric Cooling Water",
"path": "https://www.eia.gov/electricity/data/water",
"description": (
"Monthly cooling water usage by generator and boiler. Data "
"collected in conjunction with the EIA-860 and EIA-923."
),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"epacems": {
"title": "EPA Hourly Continuous Emission Monitoring System (CEMS)",
"path": "https://ampd.epa.gov/ampd",
"description": (
"US EPA hourly Continuous Emissions Monitoring System (CEMS) data."
),
"field_namespace": "epacems",
"working_partitions": {
"years": sorted(set(range(1995, 2021))),
"states": sorted(set(EPACEMS_STATES)),
},
"contributors": [
CONTRIBUTORS["catalyst-cooperative"],
CONTRIBUTORS["karl-dunkle-werner"],
CONTRIBUTORS["zane-selvans"],
],
"keywords": sorted(set(
[
"continuous emissions monitoring system",
"cems",
"air markets program data",
"ampd",
"hourly",
]
+ KEYWORDS["epa"]
+ KEYWORDS["us_govt"]
+ KEYWORDS["electricity"]
+ KEYWORDS["environment"]
)),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"ferc1": {
"title": "FERC Form 1",
"path": "https://www.ferc.gov/industries-data/electric/general-information/electric-industry-forms/form-1-electric-utility-annual",
"description": (
"The Federal Energy Regulatory Commission (FERC) Form 1 is a "
"comprehensive financial and operating report submitted annually for "
"electric rate regulation, market oversight analysis, and financial audits "
"by Major electric utilities, licensees and others."
),
"field_namespace": "ferc1",
"working_partitions": {
"years": sorted(set(range(1994, 2021))),
},
"contributors": [
CONTRIBUTORS["catalyst-cooperative"],
CONTRIBUTORS["zane-selvans"],
CONTRIBUTORS["christina-gosnell"],
CONTRIBUTORS["steven-winter"],
CONTRIBUTORS["alana-wilson"],
CONTRIBUTORS["austen-sharpe"],
],
"keywords": sorted(set(
[
"form 1",
"ferc1",
]
+ KEYWORDS["ferc"]
+ KEYWORDS["us_govt"]
+ KEYWORDS["finance"]
+ KEYWORDS["electricity"]
+ KEYWORDS["plants"]
+ KEYWORDS["fuels"]
)),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"ferc2": {
"title": "FERC Form 2",
"path": "https://www.ferc.gov/industries-data/natural-gas/industry-forms/form-2-2a-3-q-gas-historical-vfp-data",
"description": (
"The Federal Energy Regulatory Commission (FERC) Form 2 is a "
"comprehensive financial and operating report submitted for natural gas "
"pipelines rate regulation and financial audits."
),
"field_namespace": "ferc2",
"working_partitions": {
"years": [], # Not yet working!
},
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"ferc714": {
"title": "FERC Form 714: Annual Electric Balancing Authority Area and Planning Area Report",
"path": "https://www.ferc.gov/industries-data/electric/general-information/electric-industry-forms/form-no-714-annual-electric",
"description": (
"Electric transmitting utilities operating balancing authority "
"areas and planning areas with annual peak demand over 200MW are required "
"to file Form 714 with the Federal Energy Regulatory Commission (FERC), "
"reporting balancing authority area generation, actual and scheduled "
"inter-balancing authority area power transfers, and net energy for load, "
"summer-winter generation peaks and system lambda."
),
"field_namespace": "ferc714",
"working_partitions": {}, # Data is monolitic, one file with all years.
"keywords": sorted(set(
[
"form 714",
"ferc714",
]
+ KEYWORDS["ferc"]
+ KEYWORDS["us_govt"]
+ KEYWORDS["electricity"]
)),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"ferceqr": {
"title": "FERC Form 920: Electric Quarterly Report (EQR)",
"path": "https://www.ferc.gov/industries-data/electric/power-sales-and-markets/electric-quarterly-reports-eqr",
"description": (
"The EQR contains Seller-provided data summarizing contractual terms and "
"conditions in agreements for all jurisdictional services, including "
"cost-based sales, market-based rate sales, and transmission service, "
"as well as transaction information for short-term and long-term "
"market-based power sales and cost-based power sales."
),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"mshamines": {
"title": "Mine Safety and Health Administration (MSHA) Mines",
"path": "https://arlweb.msha.gov/OpenGovernmentData/OGIMSHA.asp",
"description": (
"The Mine dataset lists all Coal and Metal/Non-Metal mines under MSHA's "
"jurisdiction. It includes such information as the current status of each "
"mine (Active, Abandoned, NonProducing, etc.), the current owner and "
"operating company, commodity codes and physical attributes of the mine."
),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"phmsagas": {
"title": "Pipelines and Hazardous Materials Safety Administration (PHMSA) Annual Natural Gas Report",
"path": "https://www.phmsa.dot.gov/data-and-statistics/pipeline/gas-distribution-gas-gathering-gas-transmission-hazardous-liquids",
"description": (
"Annual reports submitted to PHMSA from gas distribution, gas gathering, "
"gas transmission, liquefied natural gas, and underground gas storage "
"system operators. Annual reports include information such as total "
"pipeline mileage, facilities, commodities transported, miles by material, "
"and installation dates."
),
"license_raw": LICENSES["us-govt"],
"license_pudl": LICENSES["cc-by-4.0"],
},
"pudl": {
"title": "The Public Utility Data Liberation (PUDL) Project",
"path": "https://catalyst.coop/pudl",
"description": (
"PUDL is a data processing pipeline created by Catalyst Cooperative that "
"cleans, integrates, and standardizes some of the most widely used public "
"energy datasets in the US. The data serve researchers, activists, "
"journalists, and policy makers that might not have the technical expertise "
"to access it in its raw form, the time to clean and prepare the data for "
"bulk analysis, or the means to purchase it from existing commercial "
"providers."
),
"contributors": [
CONTRIBUTORS["catalyst-cooperative"],
CONTRIBUTORS["zane-selvans"],
CONTRIBUTORS["christina-gosnell"],
CONTRIBUTORS["steven-winter"],
],
"field_namespace": "pudl",
"keywords": ["us", "electricity", "open data", "open source"],
"license_raw": LICENSES["cc-by-4.0"],
"license_pudl": LICENSES["cc-by-4.0"],
"email": "pudl@catalyst.coop",
},
}
"""
Data source attributes by PUDL identifier.
"""