topN,
exclude_phrases,
from_date,
- to_date)
+ to_date
+ )
def author_cosine_similarities(outfile, min_df=2, max_df=None, included_subreddits=None, topN=10000, from_date=None, to_date=None):
    """Call ``cosine_similarities`` on the hard-coded ``comment_authors.parquet`` path.

    ``topN`` is passed as the second positional argument; ``from_date`` and
    ``to_date`` are passed through by keyword, and ``exclude_phrases`` is
    always ``False``. Whatever ``cosine_similarities`` returns is returned
    unchanged.

    NOTE(review): ``outfile``, ``min_df``, ``max_df`` and
    ``included_subreddits`` are accepted but not forwarded by the call as
    it appears here -- confirm against the signature of
    ``cosine_similarities`` that ``topN`` really belongs in the second
    positional slot and that nothing was dropped.
    """
    return cosine_similarities(
        '/gscratch/comdata/output/reddit_similarity/tfidf/comment_authors.parquet',
        topN,
        exclude_phrases=False,
        from_date=from_date,
        to_date=to_date,
    )
def author_tf_similarities(outfile, min_df=2, max_df=None, included_subreddits=None, topN=10000, from_date=None, to_date=None):
    """Call ``cosine_similarities`` on ``comment_authors.parquet`` using the ``relative_tf`` column.

    ``from_date`` and ``to_date`` are passed through by keyword,
    ``exclude_phrases`` is always ``False`` and ``tfidf_colname`` is fixed
    to ``'relative_tf'``. Whatever ``cosine_similarities`` returns is
    returned unchanged.

    NOTE(review): ``outfile``, ``min_df``, ``max_df``,
    ``included_subreddits`` and ``topN`` are accepted but not forwarded by
    the call as it appears here -- confirm against the signature of
    ``cosine_similarities`` whether they should be.
    """
    return cosine_similarities(
        '/gscratch/comdata/output/reddit_similarity/tfidf/comment_authors.parquet',
        exclude_phrases=False,
        from_date=from_date,
        to_date=to_date,
        tfidf_colname='relative_tf',
    )
if __name__ == "__main__":