1
0

Add `term_ids` parameter to the weekly cosine-similarity wrapper functions and forward it to the underlying calls.

This commit is contained in:
Nathan TeBlunthuis 2025-01-12 00:47:47 -08:00
parent b4f9ce0ad2
commit e568ee6db7

View File

@ -147,7 +147,7 @@ def author_cosine_similarities_weekly(outfile, infile='/gscratch/comdata/output/
clusters=clusters
)
def term_cosine_similarities_weekly(outfile, infile='/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms.parquet', min_df=None, max_df=None, included_subreddits=None, topN=None, static_tfidf_path=None, clusters=None):
def term_cosine_similarities_weekly(outfile, infile='/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms.parquet', min_df=None, max_df=None, included_subreddits=None, topN=None, static_tfidf_path=None, clusters=None,term_ids=None):
return cosine_similarities_weekly(infile,
outfile,
'term',
@ -156,10 +156,11 @@ def term_cosine_similarities_weekly(outfile, infile='/gscratch/comdata/output/re
included_subreddits,
topN,
static_tfidf_path=static_tfidf_path,
clusters=clusters)
clusters=clusters,
term_ids=term_ids)
def author_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_authors_test.parquet', included_subreddits=None, n_components=100,lsi_model=None,static_tfidf_path=None, min_df=None, clusters=None, min_date=None, max_date=None,cores=1):
def author_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_authors_test.parquet', included_subreddits=None, n_components=100,lsi_model=None,static_tfidf_path=None, min_df=None, clusters=None, min_date=None, max_date=None,cores=1,term_ids=None):
return cosine_similarities_weekly_lsi(infile,
outfile,
'author',
@ -171,11 +172,12 @@ def author_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/o
clusters=clusters,
min_date=min_date,
max_date=max_date,
cores=cores
cores=cores,
term_ids=term_ids
)
def term_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms.parquet', included_subreddits=None, n_components=100,lsi_model=None,static_tfidf_path=None,clusters=None,cores=1):
def term_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms.parquet', included_subreddits=None, n_components=100,lsi_model=None,static_tfidf_path=None,clusters=None,cores=1,term_ids=None):
return cosine_similarities_weekly_lsi(infile,
outfile,
'term',
@ -186,7 +188,8 @@ def term_cosine_similarities_weekly_lsi(outfile, infile = '/gscratch/comdata/out
clusters=clusters,
min_date=min_date,
max_date=max_date,
cores=cores
cores=cores,
term_ids=term_ids
)
if __name__ == "__main__":