Skip to content

Commit 05bffea

Browse files
committed
use lag and issue from csv file
1 parent 2395b48 commit 05bffea

File tree

3 files changed

+12
-13
lines changed

3 files changed

+12
-13
lines changed

integrations/acquisition/covidcast_nowcast/test_csv_uploading.py

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -75,8 +75,8 @@ def test_uploading(self):
7575

7676
# valid
7777
with open(receiving_dir + '20200419_state_sig.csv', 'w') as f:
78-
f.write('sensor_name,geo_value,value\n')
79-
f.write('testsensor,ca,1\n')
78+
f.write('sensor_name,geo_value,value,lag,issue\n')
79+
f.write('testsensor,ca,1,2,20200421\n')
8080

8181
# invalid filename
8282
with open(receiving_dir + 'hello.csv', 'w') as f:
@@ -129,12 +129,12 @@ def test_duplicate_row(self):
129129
os.makedirs(receiving_dir, exist_ok=True)
130130

131131
with open(receiving_dir + '20200419_state_sig.csv', 'w') as f:
132-
f.write('sensor_name,geo_value,value\n')
133-
f.write('testsensor,ca,1\n')
132+
f.write('sensor_name,geo_value,value,lag,issue\n')
133+
f.write('testsensor,ca,1,2,20200415\n')
134134
main()
135135
with open(receiving_dir + '20200419_state_sig.csv', 'w') as f:
136-
f.write('sensor_name,geo_value,value\n')
137-
f.write('testsensor,ca,2\n')
136+
f.write('sensor_name,geo_value,value,lag,issue\n')
137+
f.write('testsensor,ca,2,2,20200415\n')
138138
main()
139139

140140
# the most recent value is the one stored
@@ -146,7 +146,7 @@ def test_duplicate_row(self):
146146
'time_value': 20200419,
147147
'geo_value': 'ca',
148148
'value': 2,
149-
'issue': 20200421,
149+
'issue': 20200415,
150150
'lag': 2,
151151
'signal': 'sig',
152152
}],

src/acquisition/covidcast_nowcast/load_sensors.py

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@
1212
FAIL_DIR = "archive/failed"
1313
TABLE_NAME = "covidcast_nowcast"
1414
DB_NAME = "epidata"
15-
CSV_DTYPES = {"sensor_name": str, "geo_value": str, "value": float}
15+
CSV_DTYPES = {"sensor_name": str, "geo_value": str, "value": float, "lag": int, "issue": int}
1616

1717

1818
def main(csv_path: str = SENSOR_CSV_PATH) -> None:
@@ -75,8 +75,7 @@ def load_and_prepare_file(filepath: str, attributes: tuple) -> pd.DataFrame:
7575
data["time_type"] = time_type
7676
data["geo_type"] = geo_type
7777
data["time_value"] = time_value
78-
data["issue"] = issue_value
79-
data["lag"] = lag_value
78+
# we don't use the computed lag and issue values since they're specified as columns in the CSV data.
8079
data["value_updated_timestamp"] = int(time.time())
8180
return data
8281

tests/acquisition/covidcast_nowcast/test_load_sensors.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -28,17 +28,17 @@ def test_load_and_prepare_file(self):
2828
"test_issue_value",
2929
"test_lag_value")
3030

31-
test_df = load_and_prepare_file(StringIO("sensor_name,geo_value,value\ntestname,01001,1.5"), test_attributes)
31+
test_df = load_and_prepare_file(StringIO("sensor_name,geo_value,value,lag,issue\ntestname,01001,1.5,2,20200101"), test_attributes)
3232
pd.testing.assert_frame_equal(test_df,
3333
pd.DataFrame({"sensor_name": ["testname"],
3434
"geo_value": ["01001"],
3535
"value": [1.5],
36+
"lag": [2],
37+
"issue": [20200101],
3638
"source": ["test_source"],
3739
"signal": ["test_signal"],
3840
"time_type": ["test_time_type"],
3941
"geo_type": ["test_geo_type"],
4042
"time_value": ["test_time_value"],
41-
"issue": ["test_issue_value"],
42-
"lag": ["test_lag_value"],
4343
"value_updated_timestamp": [12345]})
4444
)

0 commit comments

Comments
 (0)