correct paths.
This commit is contained in:
parent
1cca01fb69
commit
85945eae90
@@ -5,8 +5,8 @@ from pyspark.sql import SparkSession
|
|||||||
import numpy as np
|
import numpy as np
|
||||||
|
|
||||||
spark = SparkSession.builder.getOrCreate()
|
spark = SparkSession.builder.getOrCreate()
|
||||||
df = spark.read.text("/gscratch/comdata/users/nathante/reddit_comment_ngrams_10p_sample/")
|
df = spark.read.text("/gscratch/comdata/output/reddit_ngrams/reddit_comment_ngrams_10p_sample/")
|
||||||
df2 = spark.read.text("/gscratch/comdata/users/nathante/reddit_post_ngrams_10p_sample/")
|
df2 = spark.read.text("/gscratch/comdata/output/reddit_ngrams/reddit_post_ngrams_10p_sample/")
|
||||||
df = df.union(df2)
|
df = df.union(df2)
|
||||||
|
|
||||||
df = df.withColumnRenamed("value","phrase")
|
df = df.withColumnRenamed("value","phrase")
|
||||||
|
Loading…
Reference in New Issue
Block a user