]> code.communitydata.science - cdsc_reddit.git/commitdiff
bugfix
author Nate E TeBlunthuis <nathante@klone-login01.hyak.local>
Tue, 27 Apr 2021 05:31:05 +0000 (22:31 -0700)
committer Nate E TeBlunthuis <nathante@klone-login01.hyak.local>
Tue, 27 Apr 2021 05:31:05 +0000 (22:31 -0700)
similarities/tfidf.py

index 98a283528e1066bafa2759cb6c548e5eae2caf26..7f579faabb7092dacfb210f913f7b243d4c79337 100644 (file)
@@ -17,7 +17,7 @@ def _tfidf_wrapper(func, inpath, outpath, topN, term_colname, exclude, included_
 
     df = func(df, include_subs, term_colname)
 
 
     df = func(df, include_subs, term_colname)
 
-    df.write.parquet(outpath,mode='overwrite',copmression='snappy')
+    df.write.parquet(outpath,mode='overwrite',compression='snappy')
 
     spark.stop()
 
 
     spark.stop()
 

Community Data Science Collective || Want to submit a patch?