Spaces:

Tymec
/

sentiment-analysis

Runtime error

Tymec committed on Jun 2, 2024

Commit

c5ed75e

1 Parent(s): d09d1f6

Add document frequency threshold

Files changed (1) hide show

app/model.py CHANGED Viewed

@@ -62,11 +62,6 @@ def train_model(
         random_state=seed,
     )
-    param_distributions = {
-        "classifier__C": np.logspace(-4, 4, 20),
-        "classifier__solver": ["liblinear", "saga"],
-    }
     model = Pipeline(
         [
             (
@@ -79,6 +74,8 @@ def train_model(
                     preprocessor=_identity,
                     lowercase=False,
                     token_pattern=None,
                 ),
             ),
             (
@@ -93,6 +90,11 @@ def train_model(
         verbose=verbose,
     )
     search = RandomizedSearchCV(
         model,
         param_distributions,

         random_state=seed,
     )
     model = Pipeline(
         [
             (
                     preprocessor=_identity,
                     lowercase=False,
                     token_pattern=None,
+                    min_df=0.1,
+                    max_df=0.9,
                 ),
             ),
             (
         verbose=verbose,
     )
+    param_distributions = {
+        "classifier__C": np.logspace(-4, 4, 20),
+        "classifier__solver": ["liblinear", "saga"],
+    }
     search = RandomizedSearchCV(
         model,
         param_distributions,