version of weekly_cosine_similarities.py from klone
This commit is contained in:
parent
37dd0ef55f
commit
34e0a0a30d
@ -61,7 +61,7 @@ def cosine_similarities_weekly(tfidf_path, outfile, term_colname, min_df = None,
|
|||||||
list(pool.map(weeks,week_similarities_helper))
|
list(pool.map(weeks,week_similarities_helper))
|
||||||
|
|
||||||
def author_cosine_similarities_weekly(outfile, min_df=2 , included_subreddits=None, topN=500):
|
def author_cosine_similarities_weekly(outfile, min_df=2 , included_subreddits=None, topN=500):
|
||||||
return cosine_similarities_weekly('/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_authors_100k.parquet',
|
return cosine_similarities_weekly('/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_authors_30k.parquet',
|
||||||
outfile,
|
outfile,
|
||||||
'author',
|
'author',
|
||||||
min_df,
|
min_df,
|
||||||
@ -69,7 +69,7 @@ def author_cosine_similarities_weekly(outfile, min_df=2 , included_subreddits=No
|
|||||||
topN)
|
topN)
|
||||||
|
|
||||||
def term_cosine_similarities_weekly(outfile, min_df=None, included_subreddits=None, topN=500):
|
def term_cosine_similarities_weekly(outfile, min_df=None, included_subreddits=None, topN=500):
|
||||||
return cosine_similarities_weekly('/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms_100k.parquet',
|
return cosine_similarities_weekly('/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms_30k.parquet',
|
||||||
outfile,
|
outfile,
|
||||||
'term',
|
'term',
|
||||||
min_df,
|
min_df,
|
||||||
|
Loading…
Reference in New Issue
Block a user