-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathcreateJobs.sh
More file actions
17 lines (12 loc) · 775 Bytes
/
createJobs.sh
File metadata and controls
17 lines (12 loc) · 775 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
#!/usr/bin/env bash
#
# Prepare a submit directory for one journal and print an example mkdag
# command for it.
#
# Usage: createJobs.sh JOURNAL [TAG]
#   JOURNAL  journal name; appended verbatim to the downloads path to locate
#            the input, and cleaned (commas removed, spaces -> underscores)
#            to form the submit directory name
#   TAG      optional suffix appended to the cleaned journal name
#
# Should be run from the ChtcRun directory: ../deepdive/pdf_to_dag.py and
# ./shared are both resolved relative to the current working directory.

set -euo pipefail

# Print a message to stderr and abort.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

if (( $# < 1 )) || [[ -z "$1" ]]; then
  printf 'Usage: %s JOURNAL [TAG]\n' "${0##*/}" >&2
  exit 2
fi

readonly filepath="/home/iaross/DeepDive/downloads/"
journal=$1
tag=${2:-}   # the tag is optional; default to empty so `set -u` does not trip

# clean up journal name, removing commas and spaces
journal_clean=${journal//,/}
journal_clean=${journal_clean// /_}
job_dir="${journal_clean}${tag}"

# A journal made only of commas (with no tag) would leave nothing to name the
# submit directory after.
[[ -n "$job_dir" ]] || die "error: '${journal}' yields an empty directory name"

# assume ChtcRun/shared exists and holds all common shared junk; verify that
# up front so we fail before doing any work rather than after.
[[ -d shared ]] || die "error: ./shared not found; run this from the ChtcRun directory"

# NOTE(review): pdf_to_dag.py presumably creates/populates "$job_dir" from the
# downloaded PDFs -- confirm against that script.
python ../deepdive/pdf_to_dag.py "${filepath}${journal}" "$job_dir" \
  || die "error: pdf_to_dag.py failed for '${journal}'"

cp -r -- shared "$job_dir" \
  || die "error: could not copy ./shared into '${job_dir}'"

printf '%s\n' "Submit directories prepared! Use mkdag to create the DAGs, passing relevant runtime arguments. e.g.:"
# Kept inside one quoted string so that *.html is printed literally instead of
# being glob-expanded against the current directory.
printf '%s\n' "./mkdag --cmdtorun=ocr_pdf.py --parg=input.pdf --parg=--cuneiform --parg=--tesseract --data=${job_dir} --outputdir=${job_dir}_out --pattern=*.html --type=other"