X-Git-Url: https://code.communitydata.science/cdsc_reddit.git/blobdiff_plain/34185337c9c6f073ce8f8cb0e1b7ea605861b6e8..4ec9c1424711eb81edf6b6431d5dfae360013174:/comments_2_parquet.py?ds=sidebyside diff --git a/comments_2_parquet.py b/comments_2_parquet.py index bd853f7..8716abd 100755 --- a/comments_2_parquet.py +++ b/comments_2_parquet.py @@ -1,5 +1,5 @@ - #!/usr/bin/env python3 + import pyspark from pyspark.sql import functions as f from pyspark.sql.types import *