From e568ee6db75878b09ed020f8d18a1b3b521dc0b0 Mon Sep 17 00:00:00 2001 From: Nathan TeBlunthuis Date: Sun, 12 Jan 2025 00:47:47 -0800 Subject: [PATCH] add term_ids parameter to the weekly cosine similarity wrappers. --- similarities/weekly_cosine_similarities.py | 15 +++++++++------ 1 file changed, 9 insertions(+), 6 deletions(-) diff --git a/similarities/weekly_cosine_similarities.py b/similarities/weekly_cosine_similarities.py index 0b18dca..a8f39d7 100755 --- a/similarities/weekly_cosine_similarities.py +++ b/similarities/weekly_cosine_similarities.py @@ -147,7 +147,7 @@ def author_cosine_similarities_weekly(outfile, infile='/gscratch/comdata/output/ clusters=clusters ) -def term_cosine_similarities_weekly(outfile, infile='/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms.parquet', min_df=None, max_df=None, included_subreddits=None, topN=None, static_tfidf_path=None, clusters=None): +def term_cosine_similarities_weekly(outfile, infile='/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms.parquet', min_df=None, max_df=None, included_subreddits=None, topN=None, static_tfidf_path=None, clusters=None,term_ids=None): return cosine_similarities_weekly(infile, outfile, 'term', @@ -156,10 +156,11 @@ def term_cosine_similarities_weekly(outfile, infile='/gscratch/comdata/output/re included_subreddits, topN, static_tfidf_path=static_tfidf_path, - clusters=clusters) + clusters=clusters, + term_ids=term_ids) -def author_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_authors_test.parquet', included_subreddits=None, n_components=100,lsi_model=None,static_tfidf_path=None, min_df=None, clusters=None, min_date=None, max_date=None,cores=1): +def author_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_authors_test.parquet', included_subreddits=None, n_components=100,lsi_model=None,static_tfidf_path=None, min_df=None, clusters=None, min_date=None, 
max_date=None,cores=1,term_ids=None): return cosine_similarities_weekly_lsi(infile, outfile, 'author', @@ -171,11 +172,12 @@ def author_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/o clusters=clusters, min_date=min_date, max_date=max_date, - cores=cores + cores=cores, + term_ids=term_ids ) -def term_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms.parquet', included_subreddits=None, n_components=100,lsi_model=None,static_tfidf_path=None,clusters=None,cores=1): +def term_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms.parquet', included_subreddits=None, n_components=100,lsi_model=None,static_tfidf_path=None,clusters=None,cores=1,term_ids=None): return cosine_similarities_weekly_lsi(infile, outfile, 'term', @@ -186,7 +188,8 @@ def term_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/out clusters=clusters, min_date=min_date, max_date=max_date, - cores=cores + cores=cores, + term_ids=term_ids ) if __name__ == "__main__":