X-Git-Url: https://code.communitydata.science/cdsc_reddit.git/blobdiff_plain/67857a3b05b9bf7db684b5d2ab34802fa02ab08f..4eb82d2740b67de4bd2b90b9d88659e9311cff6d:/comments_2_parquet.py diff --git a/comments_2_parquet.py b/comments_2_parquet.py index cff1634..8716abd 100755 --- a/comments_2_parquet.py +++ b/comments_2_parquet.py @@ -1,7 +1,7 @@ - #!/usr/bin/env python3 + import pyspark -nfrom pyspark.sql import functions as f +from pyspark.sql import functions as f from pyspark.sql.types import * from pyspark import SparkConf, SparkContext from pyspark.sql import SparkSession, SQLContext