Handle the case where we're in the parent directory of cdsc_reddit.
This commit is contained in:
parent
a84b633641
commit
a0a6a08bf2
@ -222,11 +222,16 @@ def gen_task_list(mwe_pass='first',
|
|||||||
dataset='comments'):
|
dataset='comments'):
|
||||||
files = os.listdir(input_parquet)
|
files = os.listdir(input_parquet)
|
||||||
|
|
||||||
with open("tf_task_list",'w') as outfile:
|
|
||||||
curdir = Path('.')
|
curdir = Path('.')
|
||||||
|
if curdir.absolute().name == 'cdsc_reddit':
|
||||||
|
curdir = str(curdir.absolute())
|
||||||
|
else:
|
||||||
|
curdir = str(curdir.absolute() / "cdsc_reddit")
|
||||||
|
with open("tf_task_list",'w') as outfile:
|
||||||
|
|
||||||
for f in files:
|
for f in files:
|
||||||
if f.endswith(".parquet"):
|
if f.endswith(".parquet"):
|
||||||
outfile.write(f"{str(curdir.absolute())}/term_frequencies.py weekly_tf {f} --mwe-pass {mwe_pass} --input-parquet {input_parquet} --output-01p-sample-path {output_10p_sample_path} --temp-output-tfidf-path {temp_output_tfidf_path} --output-terms-path {output_terms_path} --output-authors-path {output_terms_path} --dataset {dataset}\n")
|
outfile.write(f"{curdir}/term_frequencies.py weekly_tf {f} --mwe-pass {mwe_pass} --input-parquet {input_parquet} --output-01p-sample-path {output_10p_sample_path} --temp-output-tfidf-path {temp_output_tfidf_path} --output-terms-path {output_terms_path} --output-authors-path {output_terms_path} --dataset {dataset}\n")
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
fire.Fire({"gen_task_list":gen_task_list,
|
fire.Fire({"gen_task_list":gen_task_list,
|
||||||
|
Loading…
Reference in New Issue
Block a user