diff --git a/similarities/weekly_cosine_similarities.py b/similarities/weekly_cosine_similarities.py index 7e1d668..edacca3 100755 --- a/similarities/weekly_cosine_similarities.py +++ b/similarities/weekly_cosine_similarities.py @@ -126,8 +126,11 @@ def cosine_similarities_weekly(tfidf_path, outfile, term_colname, included_subre return outfile.exists() if not overwrite: + print("not overwriting") weeks = [week for week in weeks if not output_exists(week)] + print(weeks, flush=True) + if clusters is not None: clusters_raw = pd.read_feather(clusters) clusters = duckdb.sql("SELECT A.subreddit AS sr_i, B.subreddit AS sr_j FROM clusters_raw AS A JOIN clusters_raw AS B ON A.cluster == B.cluster WHERE A.cluster != -1 AND B.cluster != -1").df()