-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathrun-workflow
More file actions
executable file
·30 lines (20 loc) · 1.29 KB
/
Copy pathrun-workflow
File metadata and controls
executable file
·30 lines (20 loc) · 1.29 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
#!/bin/bash
# Driver for the Twitter data workflow.
#
# All paths are relative to the current working directory, so run this from
# the directory that holds 'data/raw' and the workflow-*.py scripts. Each
# enabled stage appends its stdout to a log file under 'out/'. Stages whose
# command line is commented out below are currently disabled; only the
# sites-to-TIC stage runs.
#
# Exit status: 1 if an input directory is missing or an output directory
# cannot be created; otherwise the status of the last stage that ran.

# Print an error in this script's message format to stderr and abort.
die() {
  printf ' [ ERROR ] %s\n' "$*" >&2
  exit 1
}

# Sanity check that data and data/raw exist to process Twitter data.
# -d (rather than -e) so a stray regular file with that name is rejected.
[[ -d "data" ]] || die "No data to process"
[[ -d "data/raw" ]] || die "No raw data to process"

# If 'out' directory does not exist, then create it. Fail early if it cannot
# be created (e.g. a regular file named 'out' is in the way), because the log
# redirections below would fail otherwise.
mkdir -p -- "out" || die "Cannot create 'out' directory"

# If 'csv' directory does not exist, then create it
mkdir -p -- "csv" || die "Cannot create 'csv' directory"

# Take the 35+ million raw tweets and extract geo-enabled tweets
#time ./workflow-raw-to-geo.py >> out/out.workflow-raw-to-geo

# Take the geo-enabled tweets and find all those that mention "Ebola"
#time ./workflow-geo-to-geoebola.py >> out/out.workflow-geo-to-geoebola

# Take the geo-enabled tweets that mention Ebola and extract those near different sites
#time ./workflow-geoebola-to-sites.py >> out/out.workflow-geoebola-to-sites

# Take each site and apply TIC. Results are saved to 'csv' directory.
time ./workflow-sites-to-tic.py >> out/out.workflow-sites-to-tic

# Take each site and apply Behavior Response scripts. Results are saved to 'csv' directory.
#time ./workflow-sites-to-bresponse.py >> out/out.workflow-sites-to-bresponse

# Take geo-enabled tweets that mention Ebola and extract the locations, which are saved as a csv file
#time ./workflow-geoebola-to-geocsv.py >> out/out.workflow-geoebola-to-geocsv