Update app.py
Browse files
app.py
CHANGED
@@ -34,6 +34,9 @@ def load_reddit_split(subreddit_name):
|
|
34 |
# Combine subreddit data
|
35 |
combined_dataset = chain(*(load_reddit_split(sub) for sub in target_subreddits))
|
36 |
|
|
|
|
|
|
|
37 |
# PySpark session
|
38 |
spark = SparkSession.builder.getOrCreate()
|
39 |
df = spark.createDataFrame([{"body": ex["body"]} for ex in islice(combined_dataset, 100000)])
|
|
|
34 |
# Combine subreddit data
|
35 |
combined_dataset = chain(*(load_reddit_split(sub) for sub in target_subreddits))
|
36 |
|
37 |
+
if "JAVA_HOME" not in os.environ:
|
38 |
+
os.environ["JAVA_HOME"] = "/usr/lib/jvm/java-11-openjdk-amd64" # Common path on HF Spaces/Debian
|
39 |
+
|
40 |
# PySpark session
|
41 |
spark = SparkSession.builder.getOrCreate()
|
42 |
df = spark.createDataFrame([{"body": ex["body"]} for ex in islice(combined_dataset, 100000)])
|