-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathmake_data_sets.py
105 lines (101 loc) · 5.98 KB
/
make_data_sets.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
# Create a DataSet object for each of the programs we track.
# Initialize each one with the information it needs to do its query
# of the database.
# Store the DataSet objects in a dictionary with keys being the
# friendly names of the program, which will be used in selection
# widgets.
# In the following line, 'from DataSet' refers to the file DataSet.py
# while 'import DataSet' refers to the DataSet class within DataSet.py.
from ECHO_modules.DataSet import DataSet
def make_data_sets():
data_sets = {}
ds = DataSet( name='RCRA Violations', idx_field='ID_NUMBER',
table_name='RCRA_VIOLATIONS', echo_type="RCRA",
date_field='DATE_VIOLATION_DETERMINED', date_format='%m/%d/%Y')
data_sets[ ds.name ] = ds
ds = DataSet( name='RCRA Inspections', idx_field='ID_NUMBER',
table_name='RCRA_EVALUATIONS', echo_type="RCRA",
date_field='EVALUATION_START_DATE', date_format='%m/%d/%Y')
data_sets[ ds.name ] = ds
ds = DataSet( name='RCRA Enforcements', echo_type="RCRA",
table_name='RCRA_ENFORCEMENTS', idx_field='ID_NUMBER',
date_field='EVALUATION_START_DATE', date_format='%m/%d/%Y' )
data_sets[ ds.name ] = ds
# Special sql queries needed for Air Inspections and Air Enforcements
my_sql = "select * from `ICIS_FEC_EPA_INSPECTIONS` where REGISTRY_ID in "
ds = DataSet( name='Air Inspections', echo_type="AIR",
table_name='ICIS_FEC_EPA_INSPECTIONS', idx_field='REGISTRY_ID',
date_field='ACTUAL_END_DATE', date_format='%m/%d/%Y', sql=my_sql )
data_sets[ ds.name ] = ds
my_sql = "select * from `CASE_FACILITIES` CF, `CASE_ENFORCEMENTS` CE " + \
" where CE.HQ_DIVISION = 'AIR' and CE.CASE_NUMBER = CF.CASE_NUMBER and " + \
" CF.REGISTRY_ID in "
ds = DataSet( name='Air Enforcements', echo_type="AIR",
table_name='CASE_ENFORCEMENTS', idx_field='REGISTRY_ID',
date_field='FISCAL_YEAR', date_format='%Y', sql=my_sql )
data_sets[ ds.name ] = ds
ds = DataSet( name='Air Violations', echo_type="AIR",
table_name='ICIS-AIR_VIOLATION_HISTORY', idx_field='pgm_sys_id',
date_field='HPV_DAYZERO_DATE', date_format='%m-%d-%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='Air Formal Actions', echo_type="AIR",
table_name='ICIS-AIR_FORMAL_ACTIONS', idx_field='pgm_sys_id',
date_field='SETTLEMENT_ENTERED_DATE', date_format='%m/%d/%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='Air Compliance', echo_type="AIR",
table_name='ICIS-AIR_FCES_PCES', idx_field='PGM_SYS_ID',
date_field='ACTUAL_END_DATE', date_format='%m-%d-%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='Combined Air Emissions', echo_type=["GHG","TRI"],
table_name='POLL_RPT_COMBINED_EMISSIONS', idx_field='REGISTRY_ID',
date_field='REPORTING_YEAR', date_format='%Y' )
data_sets[ ds.name ] = ds
my_sql = "select * from `POLL_RPT_COMBINED_EMISSIONS` " + \
" where PGM_SYS_ACRNM = 'E-GGRT' and REGISTRY_ID in "
ds = DataSet( name='Greenhouse Gases', echo_type="GHG",
table_name='POLL_RPT_COMBINED_EMISSIONS', idx_field='REGISTRY_ID',
date_field='REPORTING_YEAR', date_format='%Y', sql = my_sql )
data_sets[ ds.name ] = ds
my_sql = "select * from `POLL_RPT_COMBINED_EMISSIONS` " + \
" where PGM_SYS_ACRNM = 'TRIS' and REGISTRY_ID in "
ds = DataSet( name='Toxic Releases', echo_type="TRI",
table_name='POLL_RPT_COMBINED_EMISSIONS', idx_field='REGISTRY_ID',
date_field='REPORTING_YEAR', date_format='%Y', sql = my_sql )
data_sets[ ds.name ] = ds
ds = DataSet( name='Water Quarterly Violations', echo_type="NPDES",
table_name='NPDES_QNCR_HISTORY', idx_field='NPDES_ID',
date_field='YEARQTR', date_format='%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='Clean Water Inspections', echo_type="NPDES",
table_name='NPDES_INSPECTIONS', idx_field='NPDES_ID',
date_field='ACTUAL_END_DATE', date_format='%m/%d/%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='Clean Water Enforcements', echo_type="NPDES",
table_name='NPDES_FORMAL_ENFORCEMENT_ACTIONS', idx_field='NPDES_ID',
date_field='SETTLEMENT_ENTERED_DATE', date_format='%m/%d/%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='SDWA Site Visits', echo_type="SDWA",
table_name='SDWA_SITE_VISITS', idx_field='PWSID',
date_field='SITE_VISIT_DATE', date_format='%m/%d/%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='SDWA Enforcements', echo_type="SDWA",
table_name='SDWA_ENFORCEMENTS', idx_field='PWSID',
date_field='ENFORCEMENT_DATE', date_format='%m/%d/%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='SDWA Public Water Systems', echo_type="SDWA",
table_name='SDWA_PUB_WATER_SYSTEMS', idx_field='PWSID',
date_field='FISCAL_YEAR', date_format='%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='SDWA Violations', echo_type="SDWA",
table_name='SDWA_VIOLATIONS', idx_field='PWSID',
date_field='FISCAL_YEAR', date_format='%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='SDWA Serious Violators', echo_type="SDWA",
table_name='SDWA_SERIOUS_VIOLATORS', idx_field='PWSID',
date_field='FISCAL_YEAR', date_format='%Y' )
data_sets[ ds.name ] = ds
ds = DataSet( name='SDWA Return to Compliance', echo_type="SDWA",
table_name='SDWA_RETURN_TO_COMPLIANCE', idx_field='PWSID',
date_field='FISCAL_YEAR', date_format='%Y' )
data_sets[ ds.name ] = ds
return data_sets