-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun_full_pipeline_all_sites.sh
executable file
·45 lines (39 loc) · 1.63 KB
/
run_full_pipeline_all_sites.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
#!/bin/bash
# Server-level pipeline script for all daily journal data flow/QC processing
# (audio and transcript sides).
#
# Usage: run_full_pipeline_all_sites.sh <configs_dir>
#   <configs_dir>  path to a folder that contains one *.sh config file for each
#                  site to be processed
#
# Every stage is run for all sites before the next stage starts:
#   1. site_level_pipeline_branches/audio_side.sh
#   2. site_level_pipeline_branches/transcript_side.sh
#   3. site_level_pipeline_branches/subject_summaries_update.sh
#      (subject-level summaries for each site, e.g. flagging possible issues as
#      needed, doing some merging of CSVs from across audio and transcript sides)
#
# Exit status: 1 when the argument is missing, is not a directory, or the
# directory holds no *.sh configs; 0 otherwise. A failure inside an individual
# site/stage is intentionally NOT fatal, so one bad site cannot block the rest.

if [[ -z "${1}" ]]; then
  # Diagnostics go to stderr, and a non-zero status lets the calling cron
  # script detect the misuse (a bare `exit` here would report success).
  echo "Please provide a path to folder of site configs" >&2
  exit 1
fi
configs_path=$1

if [[ ! -d "$configs_path" ]]; then
  echo "Config folder not found: $configs_path" >&2
  exit 1
fi

# get path this script is in to find repo root
# (expansions are quoted so a checkout path containing spaces still works)
full_path=$(realpath "$0")
repo_root=$(dirname "$full_path")

# Collect the site configs once so all three stages see the same set of sites.
# nullglob makes an unmatched pattern expand to nothing, instead of being
# passed along to the stage scripts as the literal string "<dir>/*.sh".
shopt -s nullglob
config_files=("$configs_path"/*.sh)
shopt -u nullglob

if (( ${#config_files[@]} == 0 )); then
  echo "No site config (*.sh) files found in: $configs_path" >&2
  exit 1
fi

# Run one site-level pipeline branch for every collected site config.
# Arguments: $1 - file name of the script under site_level_pipeline_branches
run_stage() {
  local stage_script=$1
  local file
  for file in "${config_files[@]}"; do
    bash "$repo_root"/site_level_pipeline_branches/"$stage_script" "$file"
    # add spacing for when monitoring logs in real time
    printf '\n\n\n'
  done
}

# run audio side code for each config
run_stage audio_side.sh
# run transcript side code for each config
run_stage transcript_side.sh
# finally call the part of the pipeline that will do subject-level summaries for each site
run_stage subject_summaries_update.sh
# Note: any setup of basic dependencies and permissions is done separately for each server, in the cron scripts under ampscz_diaries_launch.
# Each such cron script simply calls this high-level wrapper to do the core pipeline work.
# The main cron script should then also call the server-wide summary stats module at the top level of this repo.