code.communitydata.science - cdsc_reddit.git/blobdiff - term_cosine_similarity.py
Bugfix (typo)
[cdsc_reddit.git] / term_cosine_similarity.py
index c487c5beb8a576644d7c9cf09e90f7ed66889bce..44af4e606082185611b077100b7ab24cd7397e1a 100644 (file)
@@ -47,7 +47,7 @@ https://stanford.edu/~rezab/papers/dimsum.pdf. If similarity_threshold=0 we get
     if exclude_phrases == True:
         tfidf = tfidf.filter(~f.col(term).contains("_"))
 
-    sim_dist, tfidf = cosine_similarities(tfidf, 'term', min_df, include_subreddits, similarity_threshold)
+    sim_dist, tfidf = cosine_similarities(tfidf, 'term', min_df, included_subreddits, similarity_threshold)
 
     p = Path(outfile)
 

Community Data Science Collective || Want to submit a patch?