code.communitydata.science - cdsc_reddit.git/blobdiff - clustering/fit_tsne.py
add note to try other tf normalization strategies.
[cdsc_reddit.git] / clustering / fit_tsne.py
index 28b0fd30630e4a666d619974f321cffb4ba37470..c9f45f61320ad8eb2cb88583b27388b663f36b19 100644 (file)
@@ -5,7 +5,7 @@ from numpy import random
 import numpy as np
 from sklearn.manifold import TSNE
 
 import numpy as np
 from sklearn.manifold import TSNE
 
-similarities = "term_similarities_10000.feather"
+similarities = "/gscratch/comdata/output/reddit_similarity/subreddit_author_tf_similarities_10000.parquet"
 
 def fit_tsne(similarities, output, learning_rate=750, perplexity=50, n_iter=10000, early_exaggeration=20):
     '''
 
 def fit_tsne(similarities, output, learning_rate=750, perplexity=50, n_iter=10000, early_exaggeration=20):
     '''

Community Data Science Collective || Want to submit a patch?