code.communitydata.science - cdsc_reddit.git/commitdiff
Bugfix (typo)
author Nate E TeBlunthuis <nathante@n2347.hyak.local>
Tue, 10 Nov 2020 21:38:11 +0000 (13:38 -0800)
committer Nate E TeBlunthuis <nathante@n2347.hyak.local>
Tue, 10 Nov 2020 21:38:11 +0000 (13:38 -0800)
term_cosine_similarity.py

index c487c5beb8a576644d7c9cf09e90f7ed66889bce..44af4e606082185611b077100b7ab24cd7397e1a 100644 (file)
@@ -47,7 +47,7 @@ https://stanford.edu/~rezab/papers/dimsum.pdf. If similarity_threshold=0 we get
     if exclude_phrases == True:
         tfidf = tfidf.filter(~f.col(term).contains("_"))
 
     if exclude_phrases == True:
         tfidf = tfidf.filter(~f.col(term).contains("_"))
 
-    sim_dist, tfidf = cosine_similarities(tfidf, 'term', min_df, include_subreddits, similarity_threshold)
+    sim_dist, tfidf = cosine_similarities(tfidf, 'term', min_df, included_subreddits, similarity_threshold)
 
     p = Path(outfile)
 
 
     p = Path(outfile)
 

Community Data Science Collective || Want to submit a patch?