code.communitydata.science - cdsc_reddit.git/blobdiff - fit_tsne.py
git-annex in nathante@nate-x1:~/cdsc_reddit
[cdsc_reddit.git] / fit_tsne.py
index 37341d47ad8eec933c4acc58fee7d5b9af374a9a..7de2ac015f7960a5a37dfa7b5d54fcb6d1ebaae6 100644 (file)
@@ -24,11 +24,11 @@ mat = np.stack(mat)
 mat = mat + np.tril(mat.transpose(),k=-1)
 dist = 2*np.arccos(mat)/np.pi
 
-tsne_model = TSNE(2,learning_rate=200,perplexity=40,n_iter=5000,metric='precomputed')
+tsne_model = TSNE(2,learning_rate=750,perplexity=50,n_iter=10000,metric='precomputed',early_exaggeration=20,n_jobs=-1)
 
 tsne_fit_model = tsne_model.fit(dist)
 
-tsne_fit_whole = tsne_fit_model.fit_transform(mat)
+tsne_fit_whole = tsne_fit_model.fit_transform(dist)
 
 plot_data = pd.DataFrame({'x':tsne_fit_whole[:,0],'y':tsne_fit_whole[:,1], 'subreddit':col_names})
 

Community Data Science Collective || Want to submit a patch?