Skip to content

Commit 6e6f3f2

Browse files
committed
added todo for cogstack2csv
1 parent 904d012 commit 6e6f3f2

File tree

1 file changed

+31
-0
lines changed

1 file changed

+31
-0
lines changed

cogstack.py

Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -96,5 +96,36 @@ def cogstack2df(self, query: Dict, index: str, column_headers=None, es_gen_size:
9696
else:
9797
df = pd.DataFrame(temp_results)
9898
return df
99+
100+
""" TODO create autosave function
101+
# Construct a df
102+
search_results_filename = 'search_results.csv' # change output filename
103+
temp_results = []
104+
counter = 0
105+
save_interval = 5000 # saves every x hits
106+
df_headers = ['_index', '_type', '_id', '_score']
107+
df_headers.extend(columns)
108+
109+
with open(search_results_filename, 'a') as f_object:
110+
writer_object = writer(f_object)
111+
writer_object.writerow(df_headers)
112+
for hit in search_results:
113+
if counter % save_interval == 0:
114+
writer_object.writerows(temp_results)
115+
temp_results = []
116+
print(f'Saved {save_interval} docs')
117+
row = {}
118+
row['_index'] = hit['_index']
119+
row['_type'] = hit['_type']
120+
row['_id'] = hit['_id']
121+
row['_score'] = hit['_score']
122+
row.update(hit['_source'])
123+
temp_results.append(row.values())
124+
counter += 1
125+
126+
writer_object.writerows(temp_results)
127+
temp_results = []
128+
f_object.close()
129+
"""
99130

100131

0 commit comments

Comments
 (0)