Tymec committed on
Commit
e50b20c
1 Parent(s): a5c3a23

Add dataset for testing

Browse files
Files changed (2) hide show
  1. README.md +3 -1
  2. app/constants.py +3 -0
README.md CHANGED
@@ -11,6 +11,7 @@ datasets:
11
  - mrshu/amazonreviews
12
  - stanfordnlp/sentiment140
13
  - stanfordnlp/imdb
 
14
  models:
15
  - spacy/en_core_web_sm
16
  ---
@@ -21,12 +22,13 @@ models:
21
  1. Clone the repository
22
  2. `cd` into the repository
23
  3. Run `just install` to install the dependencies
24
- 4. Run `just app --help` to see the available commands
25
 
26
  ### Datasets
27
  - [Sentiment140](https://www.kaggle.com/datasets/kazanova/sentiment140)
28
  - [Amazon Reviews](https://www.kaggle.com/datasets/bittlingmayer/amazonreviews)
29
  - [IMDB](https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews)
 
30
 
31
  ### Required tools
32
  - `just`
 
11
  - mrshu/amazonreviews
12
  - stanfordnlp/sentiment140
13
  - stanfordnlp/imdb
14
+ - Sp1786/multiclass-sentiment-analysis-dataset
15
  models:
16
  - spacy/en_core_web_sm
17
  ---
 
22
  1. Clone the repository
23
  2. `cd` into the repository
24
  3. Run `just install` to install the dependencies
25
+ 4. Run `just run --help` to see the available commands
26
 
27
  ### Datasets
28
  - [Sentiment140](https://www.kaggle.com/datasets/kazanova/sentiment140)
29
  - [Amazon Reviews](https://www.kaggle.com/datasets/bittlingmayer/amazonreviews)
30
  - [IMDB](https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews)
31
+ - [Multiclass Sentiment Analysis](https://huggingface.co/datasets/Sp1786/multiclass-sentiment-analysis-dataset) (Used only for testing)
32
 
33
  ### Required tools
34
  - `just`
app/constants.py CHANGED
@@ -16,6 +16,9 @@ AMAZONREVIEWS_URL = "https://www.kaggle.com/datasets/bittlingmayer/amazonreviews
16
  IMDB50K_PATH = DATA_DIR / "imdb50k.csv"
17
  IMDB50K_URL = "https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews"
18
 
 
 
 
19
  CACHE_DIR.mkdir(exist_ok=True, parents=True)
20
  DATA_DIR.mkdir(exist_ok=True, parents=True)
21
  MODELS_DIR.mkdir(exist_ok=True, parents=True)
 
16
  IMDB50K_PATH = DATA_DIR / "imdb50k.csv"
17
  IMDB50K_URL = "https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews"
18
 
19
+ TEST_DATASET_PATH = DATA_DIR / "test.csv"
20
+ TEST_DATASET_URL = "https://huggingface.co/datasets/Sp1786/multiclass-sentiment-analysis-dataset"
21
+
22
  CACHE_DIR.mkdir(exist_ok=True, parents=True)
23
  DATA_DIR.mkdir(exist_ok=True, parents=True)
24
  MODELS_DIR.mkdir(exist_ok=True, parents=True)