-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfile_collecting.py
38 lines (29 loc) · 1.29 KB
/
file_collecting.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
from glob import glob
import pandas as pd
import os
import shutil
# Collect the City of London and Metropolitan police CSV exports that are
# scattered across sub-folders of the download directory, and copy every
# "outcomes" file into a single flat destination folder.

# Destination folder that receives a copy of each outcomes CSV.
folder_path = 'C:/Users/Hoan/Documents/policeoutcomedata'
# Root directory that is searched recursively for the source CSV files.
source_root = 'C:/Users/Hoan/Documents/Advanced data management'


def _find_csvs(suffix):
    """Return all paths under ``source_root`` whose file name ends with *suffix*.

    The search is recursive (``**``), so files at any depth are matched.
    The result order is whatever ``glob`` yields; callers sort it themselves.
    """
    # Plain '/' concatenation keeps the pattern identical to the one the
    # script has always used, so returned path strings are unchanged.
    return glob(source_root + '/**/*' + suffix, recursive=True)


street_files_1 = _find_csvs('city-of-london-street.csv')
street_files_2 = _find_csvs('metropolitan-street.csv')
outcome_files_1 = _find_csvs('city-of-london-outcomes.csv')
outcome_files_2 = _find_csvs('metropolitan-outcomes.csv')

# Sorted, combined lists for both police forces. ``street_files`` is not
# used by the copy step below, but it is kept available for later steps.
street_files = sorted(street_files_1 + street_files_2)
outcome_files = sorted(outcome_files_1 + outcome_files_2)

if outcome_files:
    # shutil.copy() treats a non-existent destination as a *file name*, so
    # without this every copy would overwrite one file called
    # "policeoutcomedata" instead of landing inside the folder.
    os.makedirs(folder_path, exist_ok=True)

for outcome_file in outcome_files:
    # The destination is a directory, so the original file name is kept.
    shutil.copy(outcome_file, folder_path)
# Disabled alternative: instead of copying the files one by one, merge all
# matched CSVs into a single file per category (uses pandas). Uncomment to use.
# df_list = []
# for r in street_files:
#     df = pd.read_csv(r)
#     df_list.append(df)
# big_df = pd.concat(df_list, ignore_index=True)
# big_df.to_csv(os.path.join(folder_path, 'street-data.csv'), index=False)
# outcome_files = outcome_files_1 + outcome_files_2
# outcome_files.sort()
# df_list = []
# for r in outcome_files:
#     df = pd.read_csv(r)
#     df_list.append(df)
# big_df = pd.concat(df_list, ignore_index=True)
# big_df.to_csv(os.path.join(folder_path, 'outcomes-data.csv'), index=False)