Skip to content

Commit

Permalink
Merge pull request #427 from cisco/vidamoda/change_param_behaviour
Browse files Browse the repository at this point in the history
Change behavior of param and param selection merging
  • Loading branch information
vrdn-23 authored Jul 22, 2022
2 parents 238412f + b85faf9 commit 562dc8d
Show file tree
Hide file tree
Showing 7 changed files with 47 additions and 16 deletions.
31 changes: 26 additions & 5 deletions mindmeld/components/_config.py
Original file line number Diff line number Diff line change
Expand Up @@ -44,6 +44,9 @@
DEFAULT_DOMAIN_CLASSIFIER_CONFIG = {
"model_type": "text",
"model_settings": {"classifier_type": "logreg"},
"params": {
"solver": "liblinear",
},
"param_selection": {
"type": "k-fold",
"k": 10,
Expand All @@ -55,6 +58,9 @@
DEFAULT_INTENT_CLASSIFIER_CONFIG = {
"model_type": "text",
"model_settings": {"classifier_type": "logreg"},
"params": {
"solver": "liblinear",
},
"param_selection": {
"type": "k-fold",
"k": 10,
Expand All @@ -80,6 +86,9 @@
"tag_scheme": "IOB",
"feature_scaler": "max-abs",
},
"params": {
"solver": "liblinear",
},
"param_selection": {
"type": "k-fold",
"k": 5,
Expand Down Expand Up @@ -109,7 +118,7 @@
DEFAULT_ROLE_CLASSIFIER_CONFIG = {
"model_type": "text",
"model_settings": {"classifier_type": "logreg"},
"params": {"C": 100, "penalty": "l1"},
"params": {"C": 100, "penalty": "l1", "solver": "liblinear"},
"features": {
"bag-of-words-before": {
"ngram_lengths_to_start_positions": {1: [-2, -1], 2: [-2, -1]}
Expand Down Expand Up @@ -549,6 +558,17 @@ class NlpConfigError(Exception):
pass


def merge_param_configs(default_dict, user_defined_dict):
    """Merge the default ``params`` of a classifier config into a user config.

    User-defined params take precedence over defaults on a per-key basis.
    All other top-level keys come from ``user_defined_dict`` untouched.

    Args:
        default_dict (dict): The default classifier config (may contain a
            "params" dict, e.g. the module-level DEFAULT_*_CLASSIFIER_CONFIG).
        user_defined_dict (dict): The user/application-supplied config.

    Returns:
        dict: A new config dict whose "params" is the key-wise merge of the
        default and user params. Neither input dict is mutated, and the
        returned "params" never aliases ``default_dict["params"]`` (the
        original aliased the shared default dict, so later mutation of the
        returned config could silently corrupt the module-level defaults).
    """
    new_dict = dict(user_defined_dict)
    if "params" not in default_dict:
        # Nothing to merge; return the (shallow-copied) user config as-is.
        return new_dict
    if "params" in user_defined_dict:
        # User keys win over default keys; ** unpacking builds a fresh dict.
        new_dict["params"] = {**default_dict["params"], **user_defined_dict["params"]}
    else:
        # Copy rather than alias, so callers can't mutate the shared defaults.
        new_dict["params"] = {**default_dict["params"]}
    return new_dict


def get_custom_action_config(app_path):
if not app_path:
return None
Expand Down Expand Up @@ -669,8 +689,8 @@ def get_system_entity_url_config(app_path):

return (
get_nlp_config(app_path)
.get("system_entity_recognizer", {})
.get("url", DEFAULT_DUCKLING_URL)
.get("system_entity_recognizer", {})
.get("url", DEFAULT_DUCKLING_URL)
)


Expand Down Expand Up @@ -743,7 +763,7 @@ def get_classifier_config(
try:
raw_args = {"domain": domain, "intent": intent, "entity": entity}
args = {k: raw_args[k] for k in func_args}
return copy.deepcopy(func(**args))
return merge_param_configs(_get_default_classifier_config(clf_type), copy.deepcopy(func(**args)))
except Exception as exc: # pylint: disable=broad-except
# Note: this is intentionally broad -- provider could raise any exception
logger.warning(
Expand All @@ -759,7 +779,8 @@ def get_classifier_config(
"question_answering": "QUESTION_ANSWERER_CONFIG",
}[clf_type]
try:
return copy.deepcopy(getattr(module_conf, attr_name))
return merge_param_configs(_get_default_classifier_config(clf_type),
copy.deepcopy(getattr(module_conf, attr_name)))
except AttributeError:
try:
result = copy.deepcopy(
Expand Down
7 changes: 3 additions & 4 deletions mindmeld/components/classifier.py
Original file line number Diff line number Diff line change
Expand Up @@ -411,12 +411,11 @@ def _get_model_config(loaded_config=None, **kwargs):
if not loaded_config:
logger.warning("loaded_config is not passed in")
model_config = loaded_config or {}
if 'params' in model_config and 'params' in kwargs:
kwargs['params'].update(model_config['params'])

model_config.update(kwargs)

# If a parameter selection grid was passed in at runtime, override params set in the
# application specified or default config
if kwargs.get("param_selection") and not kwargs.get("params"):
model_config.pop("params", None)
return ModelConfig(**model_config)

def dump(self, model_path, incremental_model_path=None):
Expand Down
12 changes: 11 additions & 1 deletion mindmeld/models/model.py
Original file line number Diff line number Diff line change
Expand Up @@ -429,7 +429,7 @@ def _fit(self, examples, labels, params=None):
def _get_model_constructor(self):
raise NotImplementedError

def _fit_cv(self, examples, labels, groups=None, selection_settings=None):
def _fit_cv(self, examples, labels, groups=None, selection_settings=None, fixed_params=None):
"""Called by the fit method when cross validation parameters are passed in. Runs cross
validation and returns the best estimator and parameters.
Expand Down Expand Up @@ -463,6 +463,16 @@ def _fit_cv(self, examples, labels, groups=None, selection_settings=None):

param_grid = self._convert_params(selection_settings["grid"], labels)
model_class = self._get_model_constructor()
if fixed_params:
for key, val in fixed_params.items():
if key not in param_grid:
param_grid[key] = [val]
else:
logger.info(
"Found parameter %s both in params and param_selection. Proceeding with param_selection.. \
(If you did not set this, it could be a Mindmeld default.)",
key
)
estimator, param_grid = self._get_cv_estimator_and_params(
model_class, param_grid
)
Expand Down
4 changes: 2 additions & 2 deletions mindmeld/models/tagger_models.py
Original file line number Diff line number Diff line change
Expand Up @@ -217,7 +217,7 @@ def fit(self, examples, labels, params=None):
labels (ProcessedQueryList.EntitiesIterator): A list of expected labels.
params (dict): Parameters of the classifier.
"""
skip_param_selection = params is not None or self.config.param_selection is None
skip_param_selection = self.config.param_selection is None
params = params or self.config.params

# Shuffle to prevent order effects
Expand Down Expand Up @@ -253,7 +253,7 @@ def fit(self, examples, labels, params=None):
if isinstance(self._clf, non_supported_classes):
raise MindMeldError(f"The {type(self._clf).__name__} model does not support cross-validation")

_, best_params = self._fit_cv(X, y, groups)
_, best_params = self._fit_cv(X, y, groups, fixed_params=params)
self._clf = self._fit(X, y, best_params)
self._current_params = best_params

Expand Down
4 changes: 2 additions & 2 deletions mindmeld/models/text_models.py
Original file line number Diff line number Diff line change
Expand Up @@ -434,7 +434,7 @@ def fit(self, examples, labels, params=None):
interfaces.
"""
params = params or self.config.params
skip_param_selection = params is not None or self.config.param_selection is None
skip_param_selection = self.config.param_selection is None

# Shuffle to prevent order effects
indices = list(range(len(labels)))
Expand All @@ -454,7 +454,7 @@ def fit(self, examples, labels, params=None):
self._current_params = params
else:
# run cross validation to select params
best_clf, best_params = self._fit_cv(X, y, groups)
best_clf, best_params = self._fit_cv(X, y, groups, fixed_params=params)
self._clf = best_clf
self._current_params = best_params

Expand Down
4 changes: 2 additions & 2 deletions tests/components/test_config.py
Original file line number Diff line number Diff line change
Expand Up @@ -128,7 +128,7 @@ def test_get_classifier_config_func():
"entity", APP_PATH, domain="domain", intent="intent"
)["params"]

expected = {"penalty": "l2", "C": 100}
expected = {"penalty": "l2", "C": 100, "solver": "liblinear"}

assert actual == expected

Expand All @@ -139,7 +139,7 @@ def test_get_classifier_config_func_error():
"params"
]

expected = {"error": "intent", "penalty": "l2", "C": 100}
expected = {"error": "intent", "penalty": "l2", "C": 100, "solver": "liblinear"}

assert actual == expected

Expand Down
1 change: 1 addition & 0 deletions tests/components/test_intent_classifier.py
Original file line number Diff line number Diff line change
Expand Up @@ -74,3 +74,4 @@ def test_intent_classifier_random_forest(kwik_e_mart_app_path, caplog):
mock.assert_any_call(
"Unexpected param `fit_intercept`, dropping it from model config."
)
mock.assert_any_call("Unexpected param `solver`, dropping it from model config.")

0 comments on commit 562dc8d

Please sign in to comment.