Spaces:
Runtime error
Runtime error
Fixed file paths
Browse files
app.py
CHANGED
|
@@ -6,15 +6,18 @@ import pandas as pd
|
|
| 6 |
from datasets import load_dataset
|
| 7 |
import json
|
| 8 |
|
| 9 |
-
##Load Dataset
|
| 10 |
#dataset = load_dataset("rshah/million-headlines")
|
| 11 |
#news = pd.DataFrame.from_dict(dataset["train"])
|
| 12 |
-
|
|
|
|
|
|
|
| 13 |
news['date'] = pd.to_datetime(news['publish_date'], format='%Y%m%d')
|
| 14 |
timestamps = news.date.to_list()
|
| 15 |
tweets = news.headline_text.to_list()
|
| 16 |
|
| 17 |
-
|
|
|
|
| 18 |
topics = json.load(fp)
|
| 19 |
|
| 20 |
option_n = 5
|
|
|
|
| 6 |
from datasets import load_dataset
|
| 7 |
import json
|
| 8 |
|
| 9 |
+
## Load dataset from the Hugging Face Hub
|
| 10 |
#dataset = load_dataset("rshah/million-headlines")
|
| 11 |
#news = pd.DataFrame.from_dict(dataset["train"])
|
| 12 |
+
|
| 13 |
+
# Load the dataset from a local Parquet file - faster for the demo
|
| 14 |
+
news = pd.read_parquet("topic_10000.par")
|
| 15 |
news['date'] = pd.to_datetime(news['publish_date'], format='%Y%m%d')
|
| 16 |
timestamps = news.date.to_list()
|
| 17 |
tweets = news.headline_text.to_list()
|
| 18 |
|
| 19 |
+
# Load topics from the local "topics" file (parsed as JSON)
|
| 20 |
+
with open("topics", "r") as fp:
|
| 21 |
topics = json.load(fp)
|
| 22 |
|
| 23 |
option_n = 5
|