-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathfile_updates.py
104 lines (86 loc) · 3.07 KB
/
file_updates.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
# !/usr/bin/env python
# -*- coding: utf-8 -*-
import json
import logging
import os
from datetime import datetime, timedelta
from time import strftime
import requests
import mail_script
total_pages = 1
page = 1
tomorrow = datetime.today() + timedelta(1)
yesterday = datetime.today() - timedelta(1)
fec_params = {
'api_key': os.environ['FEC_API_KEY'],
'min_receipt_date': yesterday.strftime("%Y-%m-%d"),
'max_receipt_date': tomorrow.strftime("%Y-%m-%d"),
'page': 1,
}
# replace with DB
filing_dict ={}
base_url = 'https://api.open.fec.gov/v1/filings/?sort=-receipt_date&per_page=100'
def analize_file_num(num):
if num is None:
return ''
if num and float(num) > 0:
return num
return ''
def analize_file(num, pdf):
if num and float(num) > 0:
return 'http://docquery.fec.gov/dcdev/posted/{0}.fec'.format(num)
else:
return pdf
def read_results(results):
for r in results:
result = {
'sub_id': r['sub_id'], # primary key
'document_description': r['document_description'],
'committee_id': r['committee_id'],
'committee_name': r['committee_name'],
'candidate_name': r['candidate_name'],
'file_number': r['file_number'],
'amendment_indicator': r['amendment_indicator'],
'report_type': r['report_type'],
'report_type_full': r['report_type_full'],
'total_receipts': r['total_receipts'],
'total_disbursements': r['total_disbursements'],
'total_independent_expenditures': r['total_independent_expenditures'],
'receipt_date': r['receipt_date'],
'coverage_start_date': r['coverage_start_date'],
'coverage_end_date': r['coverage_end_date'],
'pages': r['pages'],
'fec_url': 'http://docquery.fec.gov/dcdev/posted/{0}.fec'.format(r['file_number']),
'pdf_url': r['pdf_url'],
'url': analize_file(r['file_number'], r['pdf_url']),
'show_file_num': analize_file_num(r['file_number']),
}
if r['committee_id'] in filing_dict:
filing_dict[r['committee_id']].append(result)
else:
filing_dict[r['committee_id']] = [result]
return fec_params
# fetch filings
while total_pages >= page:
filings = requests.get(base_url, params=fec_params).json()
if 'results' in filings:
read_results(filings['results'])
page = filings['pagination']['pages']
else: break
# look up users
results = []
# fetch record by committee_id
for committee_id in filing_dict:
info = {
'committee_name': filing_dict[committee_id][0]['committee_name'] or '',
'committee_id': committee_id,
'candidate_name': filing_dict[committee_id][0]['candidate_name'] or '',
'filings': filing_dict[committee_id]
}
results.append(info)
template_data = {
'date': yesterday.strftime('%b %d, %Y'),
'committees': results,
}
server = mail_script.email_log_in()
mail_script.mail_update(server, template_data, os.environ['ADMIN_EMAIL'])