code.communitydata.science - cdsc_reddit.git/commitdiff
Merge remote-tracking branch 'refs/remotes/origin/excise_reindex' into excise_reindex synced/excise_reindex
author: Nathan TeBlunthuis <nathante@uw.edu>
Wed, 6 Apr 2022 18:14:13 +0000 (11:14 -0700)
committer: Nathan TeBlunthuis <nathante@uw.edu>
Wed, 6 Apr 2022 18:14:13 +0000 (11:14 -0700)
1  2 
similarities/lsi_similarities.py
similarities/tfidf.py

Simple merge
index bbae528c0145fdcb98fcda7a9072400c43c60ebb,33562994afc9d50163c41d46361cc9e092900346..c44fd0ddbf14d49f7c96e9f4be92c03bcd5b4c96
@@@ -53,9 -75,11 +75,10 @@@ def tfidf_terms(inpath="/gscratch/comda
                   )
  
  def tfidf_authors_weekly(inpath="/gscratch/comdata/output/reddit_ngrams/comment_authors.parquet",
+                          static_tfidf_path="/gscratch/comdata/output/reddit_similarity/tfidf/comment_authors.parquet",
                           outpath='/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_authors.parquet',
                           topN=None,
 -                         included_subreddits=None
 -                         ):
 +                         included_subreddits=None):
  
      return tfidf_weekly(inpath,
                          outpath,
                          )
  
  def tfidf_terms_weekly(inpath="/gscratch/comdata/output/reddit_ngrams/comment_terms.parquet",
+                        static_tfidf_path="/gscratch/comdata/output/reddit_similarity/tfidf/comment_terms.parquet",
                         outpath='/gscratch/comdata/output/reddit_similarity/tfidf_weekly/comment_terms.parquet',
                         topN=None,
 -                       included_subreddits=None
 -                       ):
 +                       included_subreddits=None):
  
  
      return tfidf_weekly(inpath,

Community Data Science Collective || Want to submit a patch?