Spaces:
Running
Running
Add dataset for testing
Browse files
- README.md +3 -1
- app/constants.py +3 -0
README.md
CHANGED
@@ -11,6 +11,7 @@ datasets:
|
|
11 |
- mrshu/amazonreviews
|
12 |
- stanfordnlp/sentiment140
|
13 |
- stanfordnlp/imdb
|
|
|
14 |
models:
|
15 |
- spacy/en_core_web_sm
|
16 |
---
|
@@ -21,12 +22,13 @@ models:
|
|
21 |
1. Clone the repository
|
22 |
2. `cd` into the repository
|
23 |
3. Run `just install` to install the dependencies
|
24 |
-
4. Run `just
|
25 |
|
26 |
### Datasets
|
27 |
- [Sentiment140](https://www.kaggle.com/datasets/kazanova/sentiment140)
|
28 |
- [Amazon Reviews](https://www.kaggle.com/datasets/bittlingmayer/amazonreviews)
|
29 |
- [IMDB](https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews)
|
|
|
30 |
|
31 |
### Required tools
|
32 |
- `just`
|
|
|
11 |
- mrshu/amazonreviews
|
12 |
- stanfordnlp/sentiment140
|
13 |
- stanfordnlp/imdb
|
14 |
+
- Sp1786/multiclass-sentiment-analysis-dataset
|
15 |
models:
|
16 |
- spacy/en_core_web_sm
|
17 |
---
|
|
|
22 |
1. Clone the repository
|
23 |
2. `cd` into the repository
|
24 |
3. Run `just install` to install the dependencies
|
25 |
+
4. Run `just run --help` to see the available commands
|
26 |
|
27 |
### Datasets
|
28 |
- [Sentiment140](https://www.kaggle.com/datasets/kazanova/sentiment140)
|
29 |
- [Amazon Reviews](https://www.kaggle.com/datasets/bittlingmayer/amazonreviews)
|
30 |
- [IMDB](https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews)
|
31 |
+
- [Multiclass Sentiment Analysis](https://huggingface.co/datasets/Sp1786/multiclass-sentiment-analysis-dataset) (Used only for testing)
|
32 |
|
33 |
### Required tools
|
34 |
- `just`
|
app/constants.py
CHANGED
@@ -16,6 +16,9 @@ AMAZONREVIEWS_URL = "https://www.kaggle.com/datasets/bittlingmayer/amazonreviews
|
|
16 |
IMDB50K_PATH = DATA_DIR / "imdb50k.csv"
|
17 |
IMDB50K_URL = "https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews"
|
18 |
|
|
|
|
|
|
|
19 |
CACHE_DIR.mkdir(exist_ok=True, parents=True)
|
20 |
DATA_DIR.mkdir(exist_ok=True, parents=True)
|
21 |
MODELS_DIR.mkdir(exist_ok=True, parents=True)
|
|
|
16 |
IMDB50K_PATH = DATA_DIR / "imdb50k.csv"
|
17 |
IMDB50K_URL = "https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews"
|
18 |
|
19 |
+
TEST_DATASET_PATH = DATA_DIR / "test.csv"
|
20 |
+
TEST_DATASET_URL = "https://huggingface.co/datasets/Sp1786/multiclass-sentiment-analysis-dataset"
|
21 |
+
|
22 |
CACHE_DIR.mkdir(exist_ok=True, parents=True)
|
23 |
DATA_DIR.mkdir(exist_ok=True, parents=True)
|
24 |
MODELS_DIR.mkdir(exist_ok=True, parents=True)
|