13
0

Bugfix in completing TF-IDF similarity matrices.

This commit is contained in:
Nate E TeBlunthuis 2020-11-12 11:47:53 -08:00
parent 220a540beb
commit e794214653
2 changed files with 4 additions and 4 deletions

View File

@@ -71,8 +71,8 @@ https://stanford.edu/~rezab/papers/dimsum.pdf. If similarity_threshold=0 we get
similarities = similarities.join(df, on='j') similarities = similarities.join(df, on='j')
similarities = similarities.rename(columns={'subreddit':"subreddit_j"}) similarities = similarities.rename(columns={'subreddit':"subreddit_j"})
similarities.write_feather(output_feather) similarities.to_feather(output_feather)
similarities.write_csv(output_csv) similarities.to_csv(output_csv)
return similarities return similarities
if __name__ == '__main__': if __name__ == '__main__':

View File

@@ -71,8 +71,8 @@ https://stanford.edu/~rezab/papers/dimsum.pdf. If similarity_threshold=0 we get
similarities = similarities.join(df, on='j') similarities = similarities.join(df, on='j')
similarities = similarities.rename(columns={'subreddit':"subreddit_j"}) similarities = similarities.rename(columns={'subreddit':"subreddit_j"})
similarities.write_feather(output_feather) similarities.to_feather(output_feather)
similarities.write_csv(output_csv) similarities.to_csv(output_csv)
return similarities return similarities
if __name__ == '__main__': if __name__ == '__main__':