Update app.py
Browse files
app.py
CHANGED
|
@@ -34,6 +34,9 @@ def load_reddit_split(subreddit_name):
|
|
| 34 |
# Combine subreddit data
|
| 35 |
combined_dataset = chain(*(load_reddit_split(sub) for sub in target_subreddits))
|
| 36 |
|
|
|
|
|
|
|
|
|
|
| 37 |
# PySpark session
|
| 38 |
spark = SparkSession.builder.getOrCreate()
|
| 39 |
df = spark.createDataFrame([{"body": ex["body"]} for ex in islice(combined_dataset, 100000)])
|
|
|
|
| 34 |
# Combine subreddit data
|
| 35 |
combined_dataset = chain(*(load_reddit_split(sub) for sub in target_subreddits))
|
| 36 |
|
| 37 |
+
if "JAVA_HOME" not in os.environ:
|
| 38 |
+
os.environ["JAVA_HOME"] = "/usr/lib/jvm/java-11-openjdk-amd64" # Common path on HF Spaces/Debian
|
| 39 |
+
|
| 40 |
# PySpark session
|
| 41 |
spark = SparkSession.builder.getOrCreate()
|
| 42 |
df = spark.createDataFrame([{"body": ex["body"]} for ex in islice(combined_dataset, 100000)])
|