Bugfix in completing TF-IDF similarity matrices.
This commit is contained in:
parent
220a540beb
commit
e794214653
@@ -71,8 +71,8 @@ https://stanford.edu/~rezab/papers/dimsum.pdf. If similarity_threshold=0 we get
|
|||||||
similarities = similarities.join(df, on='j')
|
similarities = similarities.join(df, on='j')
|
||||||
similarities = similarities.rename(columns={'subreddit':"subreddit_j"})
|
similarities = similarities.rename(columns={'subreddit':"subreddit_j"})
|
||||||
|
|
||||||
similarities.write_feather(output_feather)
|
similarities.to_feather(output_feather)
|
||||||
similarities.write_csv(output_csv)
|
similarities.to_csv(output_csv)
|
||||||
return similarities
|
return similarities
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
|
@@ -71,8 +71,8 @@ https://stanford.edu/~rezab/papers/dimsum.pdf. If similarity_threshold=0 we get
|
|||||||
similarities = similarities.join(df, on='j')
|
similarities = similarities.join(df, on='j')
|
||||||
similarities = similarities.rename(columns={'subreddit':"subreddit_j"})
|
similarities = similarities.rename(columns={'subreddit':"subreddit_j"})
|
||||||
|
|
||||||
similarities.write_feather(output_feather)
|
similarities.to_feather(output_feather)
|
||||||
similarities.write_csv(output_csv)
|
similarities.to_csv(output_csv)
|
||||||
return similarities
|
return similarities
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
|
Loading…
Reference in New Issue
Block a user