From: Nate E TeBlunthuis
Date: Fri, 3 Jul 2020 21:00:36 +0000 (-0700)
Subject: Rename spark script to reflect that it is for comments.
X-Git-Url: https://code.communitydata.science/cdsc_reddit.git/commitdiff_plain/6dca79a41fbd5d1e967ba2cbd12da55310e5858f?ds=inline;hp=94c7a74bd9a17acf4cca61da48557a93d49cee36

Rename spark script to reflect that it is for comments.
---

diff --git a/reddit_bz2_2parquet.py b/comments_2_parquet.py
similarity index 98%
rename from reddit_bz2_2parquet.py
rename to comments_2_parquet.py
index 93c3d45..3042f58 100755
--- a/reddit_bz2_2parquet.py
+++ b/comments_2_parquet.py
@@ -6,7 +6,7 @@ from pyspark.sql.types import *
 from pyspark import SparkConf, SparkContext
 from pyspark.sql import SparkSession, SQLContext
 
-conf = SparkConf().setAppName("Reddit to bz2")
+conf = SparkConf().setAppName("Reddit comments to parquet")
 conf = conf.set('spark.sql.crossJoin.enabled',"true")
 spark = SparkSession.builder.getOrCreate()
 