]> code.communitydata.science - cdsc_reddit.git/tree
Merge remote-tracking branch 'refs/remotes/origin/master' into master synced/master
-rw-r--r-- 75 .gitignore
-rw-r--r-- 10959 README.md
-rw-r--r-- 3172 author_cosine_similarity.py
-rwxr-xr-x 1046 check_comments_shas.py
-rwxr-xr-x 1052 check_submission_shas.py
-rw-r--r-- 815 checkpoint_parallelsql.sbatch
-rw-r--r-- 1725 clustering.py
-rwxr-xr-x 431 comments_2_parquet.sh
-rwxr-xr-x 3819 comments_2_parquet_part1.py
-rwxr-xr-x 1456 comments_2_parquet_part2.py
drwxr-xr-x - examples
-rw-r--r-- 1197 fit_tsne.py
-rw-r--r-- 1604 helper.py
-rwxr-xr-x 611 pull_pushshift_comments.sh
-rwxr-xr-x 758 pull_pushshift_submissions.sh
-rwxr-xr-x 220 run_tf_jobs.sh
-rw-r--r-- 6501 similarities_helper.py
-rw-r--r-- 503 sort_tf_comments.py
-rw-r--r-- 202 submissions_2_parquet.sh
-rwxr-xr-x 4762 submissions_2_parquet_part1.py
-rw-r--r-- 1746 submissions_2_parquet_part2.py
-rw-r--r-- 5395 term_cosine_similarity.py
-rwxr-xr-x 7906 tf_comments.py
-rw-r--r-- 732 tfidf_authors.py
-rw-r--r-- 736 tfidf_comments.py
-rw-r--r-- 2550 top_comment_phrases.py
-rw-r--r-- 915 top_subreddits_by_comments.py
-rw-r--r-- 96 tsne_subreddit_fit.feather
drwxr-xr-x - visualization

Community Data Science Collective || Want to submit a patch?