30 lines
631 B
Bash
30 lines
631 B
Bash
#!/bin/bash
#
# SLURM batch job: run the olmocr pipeline over every PDF in ./studies_pdf,
# using ./studies_json as the pipeline workspace/output directory.
# Both paths are relative, so submit with `sbatch` from the directory that
# contains them (SLURM starts the job in the submission directory by default).
#
# The job's exit status is the exit status of the olmocr pipeline, so a failed
# conversion is reported as FAILED by SLURM and triggers the FAIL mail below.
#
#SBATCH -A p32852
#SBATCH -p gengpu
#SBATCH --gres=gpu:a100:1
# Only one node is requested: the commands below are not launched through
# `srun`, so they execute on the first allocated node only and any additional
# node (and its GPU) would sit idle for the whole wall time.
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --time=24:00:00
#SBATCH --mem=64G
#SBATCH --cpus-per-task=4
#SBATCH --job-name=SLR_OCR
#SBATCH --output=slr_ocr_logs.log
#SBATCH --mail-type=BEGIN,END,FAIL
#SBATCH --mail-user=gaughan@u.northwestern.edu

echo "setting up the environment"

module purge

# Load conda's shell integration. The hook output is captured first because
# `eval "$(...)"` alone would report success even when `conda` is missing.
conda_hook=$(conda shell.bash hook) || {
  echo "error: could not initialise conda (is it on PATH after 'module purge'?)" >&2
  exit 1
}
eval "$conda_hook"

# Abort rather than fall through to whatever `python` happens to be on PATH.
conda activate olmocr || {
  echo "error: could not activate the 'olmocr' conda environment" >&2
  exit 1
}

echo "running the pdf to json ocr conversion"

# Remember the pipeline's status so the cleanup below cannot mask a failure.
ocr_status=0
python -m olmocr.pipeline ./studies_json --pdfs ./studies_pdf/*.pdf || ocr_status=$?

if (( ocr_status == 0 )); then
  echo "job finished, cleaning up"
else
  echo "error: olmocr pipeline exited with status ${ocr_status}, cleaning up" >&2
fi

conda deactivate

echo "job pau at: $(date)"

# Propagate the pipeline result to SLURM (drives job state and FAIL e-mail).
exit "$ocr_status"