13
0
cdsc_reddit/density/job_script.sh

5 lines
311 B
Bash
Raw Permalink Normal View History

#!/usr/bin/bash
#
# Runs overlap_density.py in its `authors` mode under spark-submit.
#
# Steps:
#   1. start_spark_cluster.sh  - invoked before the job is submitted.
#   2. spark-submit            - submits overlap_density.py to the master at
#                                spark://<this host>:18899.
#   3. stop-all.sh             - invoked when the script exits, whether the
#                                job succeeded, failed, or was never reached.
#
# NOTE(review): start_spark_cluster.sh is presumably a site-local helper that
# starts a master listening on port 18899, and stop-all.sh is presumably
# Spark's sbin/stop-all.sh; neither is defined here - confirm both are on PATH.
# NOTE(review): overlap_density.py is referenced by a relative path, so the
# script has to be launched from the directory that contains it.
set -euo pipefail

readonly SPARK_MASTER_PORT=18899
readonly INPATH=/gscratch/comdata/output/reddit_similarity/comment_authors_10000.feather
readonly OUTPATH=/gscratch/comdata/output/reddit_density/comment_authors_10000.feather

# Teardown runs from an EXIT trap so the cluster is stopped on every exit path.
# A teardown failure is only reported; the script's exit status stays that of
# the step that ended it (normally spark-submit).
stop_cluster() {
  stop-all.sh || printf 'warning: stop-all.sh exited non-zero\n' >&2
}
trap stop_cluster EXIT

# With `set -e`, a failure here aborts before any job is submitted.
start_spark_cluster.sh

# Resolve the hostname once; a failing `hostname` aborts here instead of
# producing a malformed master URL.
master_url="spark://$(hostname):${SPARK_MASTER_PORT}"

spark-submit --master "${master_url}" \
  overlap_density.py authors \
  --inpath="${INPATH}" \
  --outpath="${OUTPATH}" \
  --agg=pd.DataFrame.sum