code.communitydata.science - cdsc_reddit.git/blobdiff - dumps/check_comments_shas.py
Merge remote-tracking branch 'refs/remotes/origin/excise_reindex' into excise_reindex
[cdsc_reddit.git] / dumps / check_comments_shas.py
index 199261c0c957c952246ae6b4cf43550a965597fc..e59a7b83e2ec78e08eb2fb8ab3af36816ac205f8 100755 (executable)
@@ -6,9 +6,9 @@ from os import path
 import hashlib
 
 shasums1 = requests.get("https://files.pushshift.io/reddit/comments/sha256sum.txt").text
-shasums2 = requests.get("https://files.pushshift.io/reddit/comments/daily/sha256sum.txt").text
+#shasums2 = requests.get("https://files.pushshift.io/reddit/comments/daily/sha256sum.txt").text
 
-shasums = shasums1 + shasums2
+shasums = shasums1 
 dumpdir = "/gscratch/comdata/raw_data/reddit_dumps/comments"
 
 for l in shasums.strip().split('\n'):

Community Data Science Collective || Want to submit a patch?