Spaces:
Runtime error
Runtime error
Add dataset for testing
Browse files
- README.md +3 -1
- app/constants.py +3 -0
README.md
CHANGED
|
@@ -11,6 +11,7 @@ datasets:
|
|
| 11 |
- mrshu/amazonreviews
|
| 12 |
- stanfordnlp/sentiment140
|
| 13 |
- stanfordnlp/imdb
|
|
|
|
| 14 |
models:
|
| 15 |
- spacy/en_core_web_sm
|
| 16 |
---
|
|
@@ -21,12 +22,13 @@ models:
|
|
| 21 |
1. Clone the repository
|
| 22 |
2. `cd` into the repository
|
| 23 |
3. Run `just install` to install the dependencies
|
| 24 |
-
4. Run `just
|
| 25 |
|
| 26 |
### Datasets
|
| 27 |
- [Sentiment140](https://www.kaggle.com/datasets/kazanova/sentiment140)
|
| 28 |
- [Amazon Reviews](https://www.kaggle.com/datasets/bittlingmayer/amazonreviews)
|
| 29 |
- [IMDB](https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews)
|
|
|
|
| 30 |
|
| 31 |
### Required tools
|
| 32 |
- `just`
|
|
|
|
| 11 |
- mrshu/amazonreviews
|
| 12 |
- stanfordnlp/sentiment140
|
| 13 |
- stanfordnlp/imdb
|
| 14 |
+
- Sp1786/multiclass-sentiment-analysis-dataset
|
| 15 |
models:
|
| 16 |
- spacy/en_core_web_sm
|
| 17 |
---
|
|
|
|
| 22 |
1. Clone the repository
|
| 23 |
2. `cd` into the repository
|
| 24 |
3. Run `just install` to install the dependencies
|
| 25 |
+
4. Run `just run --help` to see the available commands
|
| 26 |
|
| 27 |
### Datasets
|
| 28 |
- [Sentiment140](https://www.kaggle.com/datasets/kazanova/sentiment140)
|
| 29 |
- [Amazon Reviews](https://www.kaggle.com/datasets/bittlingmayer/amazonreviews)
|
| 30 |
- [IMDB](https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews)
|
| 31 |
+
- [Multiclass Sentiment Analysis](https://huggingface.co/datasets/Sp1786/multiclass-sentiment-analysis-dataset) (used only for testing)
|
| 32 |
|
| 33 |
### Required tools
|
| 34 |
- `just`
|
app/constants.py
CHANGED
|
@@ -16,6 +16,9 @@ AMAZONREVIEWS_URL = "https://www.kaggle.com/datasets/bittlingmayer/amazonreviews
|
|
| 16 |
IMDB50K_PATH = DATA_DIR / "imdb50k.csv"
|
| 17 |
IMDB50K_URL = "https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews"
|
| 18 |
|
|
|
|
|
|
|
|
|
|
| 19 |
CACHE_DIR.mkdir(exist_ok=True, parents=True)
|
| 20 |
DATA_DIR.mkdir(exist_ok=True, parents=True)
|
| 21 |
MODELS_DIR.mkdir(exist_ok=True, parents=True)
|
|
|
|
| 16 |
IMDB50K_PATH = DATA_DIR / "imdb50k.csv"
|
| 17 |
IMDB50K_URL = "https://www.kaggle.com/datasets/lakshmi25npathi/imdb-dataset-of-50k-movie-reviews"
|
| 18 |
|
| 19 |
+
TEST_DATASET_PATH = DATA_DIR / "test.csv"
|
| 20 |
+
TEST_DATASET_URL = "https://huggingface.co/datasets/Sp1786/multiclass-sentiment-analysis-dataset"
|
| 21 |
+
|
| 22 |
CACHE_DIR.mkdir(exist_ok=True, parents=True)
|
| 23 |
DATA_DIR.mkdir(exist_ok=True, parents=True)
|
| 24 |
MODELS_DIR.mkdir(exist_ok=True, parents=True)
|