Add reinforce_predictor Core API function as supported by 10.7.3-a.0

popescu-v · popescu-v · commit 4f0bc4d68b23 · 2025-05-27T15:47:13.000+02:00
Also add relevant samples of its usage.
diff --git a/doc/samples/samples.rst b/doc/samples/samples.rst
@@ -686,6 +686,37 @@ Samples
     kh.interpret_predictor(predictor_file_path, "SNB_Adult", interpretor_file_path)
 
     print(f"The interpretation model is '{interpretor_file_path}'")
+.. autofunction:: reinforce_predictor
+.. code-block:: python
+
+    # Imports
+    import os
+    from khiops import core as kh
+
+    dictionary_file_path = os.path.join(kh.get_samples_dir(), "Adult", "Adult.kdic")
+    data_table_path = os.path.join(kh.get_samples_dir(), "Adult", "Adult.txt")
+    output_dir = os.path.join("kh_samples", "reinforce_predictor")
+    analysis_report_file_path = os.path.join(output_dir, "AnalysisResults.khj")
+    reinforced_predictor_file_path = os.path.join(output_dir, "ReinforcedAdultModel.kdic")
+
+    # Build prediction model
+    _, predictor_file_path = kh.train_predictor(
+        dictionary_file_path,
+        "Adult",
+        data_table_path,
+        "class",
+        analysis_report_file_path,
+    )
+
+    # Build reinforced predictor
+    kh.reinforce_predictor(
+        predictor_file_path,
+        "SNB_Adult",
+        reinforced_predictor_file_path,
+        reinforcement_lever_variables=["occupation"],
+    )
+
+    print(f"The reinforced predictor is '{reinforced_predictor_file_path}'")
 .. autofunction:: multiple_train_predictor
 .. code-block:: python
 
@@ -1102,6 +1133,53 @@ Samples
         output_data_table_path,
         additional_data_tables={"Vehicles": vehicles_table_path},
     )
+.. autofunction:: deploy_reinforced_model_mt
+.. code-block:: python
+
+    # Imports
+    import os
+    from khiops import core as kh
+
+    # Set the file paths
+    accidents_dir = os.path.join(kh.get_samples_dir(), "AccidentsSummary")
+    dictionary_file_path = os.path.join(accidents_dir, "Accidents.kdic")
+    accidents_table_path = os.path.join(accidents_dir, "Accidents.txt")
+    vehicles_table_path = os.path.join(accidents_dir, "Vehicles.txt")
+    output_dir = os.path.join("kh_samples", "deploy_reinforced_model_mt")
+    report_file_path = os.path.join(output_dir, "AnalysisResults.khj")
+    reinforced_predictor_file_path = os.path.join(output_dir, "ReinforcedModel.kdic")
+    output_data_table_path = os.path.join(output_dir, "ReinforcedAccidents.txt")
+
+    # Train the predictor (see train_predictor_mt for details)
+    _, model_dictionary_file_path = kh.train_predictor(
+        dictionary_file_path,
+        "Accident",
+        accidents_table_path,
+        "Gravity",
+        report_file_path,
+        additional_data_tables={"Vehicles": vehicles_table_path},
+        max_trees=0,
+    )
+
+    # Reinforce the predictor
+    kh.reinforce_predictor(
+        model_dictionary_file_path,
+        "SNB_Accident",
+        reinforced_predictor_file_path,
+        reinforcement_target_value="NonLethal",
+        reinforcement_lever_variables=["InAgglomeration", "CollisionType"],
+    )
+
+    # Deploy the reinforced model on the database
+    # Besides the mandatory parameters, it is specified:
+    # - A python dictionary linking data paths to file paths for non-root tables
+    kh.deploy_model(
+        reinforced_predictor_file_path,
+        "Reinforcement_SNB_Accident",
+        accidents_table_path,
+        output_data_table_path,
+        additional_data_tables={"Vehicles": vehicles_table_path},
+    )
 .. autofunction:: deploy_model_mt_snowflake
 .. code-block:: python
 
diff --git a/khiops/core/api.py b/khiops/core/api.py
@@ -929,6 +929,69 @@ def interpret_predictor(
     _run_task("interpret_predictor", task_args)
 
 
+def reinforce_predictor(
+    dictionary_file_path_or_domain,
+    predictor_dictionary_name,
+    reinforced_predictor_file_path,
+    reinforcement_target_value="",
+    reinforcement_lever_variables=None,
+    log_file_path=None,
+    output_scenario_path=None,
+    task_file_path=None,
+    trace=False,
+    stdout_file_path="",
+    stderr_file_path="",
+    max_cores=None,
+    memory_limit_mb=None,
+    temp_dir="",
+    scenario_prologue="",
+    **kwargs,
+):
+    r"""Builds a reinforced predictor from an existing predictor
+
+    A reinforced predictor is a model which increases the importance of specified lever
+    variables in order to increase the probability of occurrence of the specified target
+    value.
+
+    Parameters
+    ----------
+    dictionary_file_path_or_domain : str or `.DictionaryDomain`
+        Path of a Khiops dictionary file or a DictionaryDomain object.
+    predictor_dictionary_name : str
+        Name of the predictor dictionary used while building the reinforced predictor.
+    reinforced_predictor_file_path : str
+        Path of the output reinforced predictor dictionary file.
+    reinforcement_target_value : str, default ""
+        If this target value is specified, then its probability of occurrence is
+        tentatively increased.
+    reinforcement_lever_variables : list of str, optional
+        The names of variables to use as lever variables while building the
+        reinforced predictor. Min length: 1. Max length: the total number of variables
+        in the prediction model.
+    ... :
+        See :ref:`core-api-common-params`.
+
+    Raises
+    ------
+    `ValueError`
+        Invalid values of an argument
+    `TypeError`
+        Invalid type of an argument
+
+    Examples
+    --------
+    See the following functions of the ``samples.py`` documentation script:
+        - `samples.reinforce_predictor()`
+        - `samples.deploy_reinforced_model_mt()`
+    """
+    # Snapshot the call arguments: ``locals()`` must only contain the parameters
+    # WARNING: Do not move this line, see the top of the "tasks" section for details
+    task_args = locals()
+
+    # Run the "reinforce_predictor" task with the captured arguments
+    _run_task("reinforce_predictor", task_args)
+
+
 def evaluate_predictor(
     dictionary_file_path_or_domain,
     train_dictionary_name,
diff --git a/khiops/core/internals/tasks/__init__.py b/khiops/core/internals/tasks/__init__.py
@@ -22,6 +22,7 @@
     extract_keys_from_data_table,
     interpret_predictor,
     prepare_coclustering_deployment,
+    reinforce_predictor,
     simplify_coclustering,
     sort_data_table,
     train_coclustering,
@@ -43,6 +44,7 @@
     extract_clusters,
     extract_keys_from_data_table,
     interpret_predictor,
+    reinforce_predictor,
     prepare_coclustering_deployment,
     simplify_coclustering,
     sort_data_table,
diff --git a/khiops/core/internals/tasks/reinforce_predictor.py b/khiops/core/internals/tasks/reinforce_predictor.py
@@ -0,0 +1,60 @@
+######################################################################################
+# Copyright (c) 2023-2025 Orange. All rights reserved.                               #
+# This software is distributed under the BSD 3-Clause-clear License, the text of     #
+# which is available at https://spdx.org/licenses/BSD-3-Clause-Clear.html or         #
+# see the "LICENSE.md" file for more details.                                        #
+######################################################################################
+"""reinforce_predictor task family"""
+from khiops.core.internals import task as tm
+from khiops.core.internals.types import ListType, StringLikeType
+
+# Disable long lines to have readable scenarios
+# pylint: disable=line-too-long
+TASKS = [
+    tm.KhiopsTask(
+        "reinforce_predictor",
+        "khiops",
+        "10.7.3-a.0",
+        [
+            ("dictionary_file_path", StringLikeType),
+            ("predictor_dictionary_name", StringLikeType),
+            ("reinforced_predictor_file_path", StringLikeType),
+        ],
+        [
+            ("reinforcement_target_value", StringLikeType, ""),
+            ("reinforcement_lever_variables", ListType(StringLikeType), None),
+        ],
+        ["dictionary_file_path", "reinforced_predictor_file_path"],
+        # Scenario template: each __<parameter>__ token below names a parameter declared above
+        # fmt: off
+        """
+        // Dictionary file and class settings
+        ClassManagement.OpenFile
+        ClassFileName __dictionary_file_path__
+        OK
+
+        // Reinforcement settings
+        TrainDatabase.ClassName __predictor_dictionary_name__
+
+        // Reinforce model
+        LearningTools.ReinforcePredictor
+        ReinforcedTargetValue __reinforcement_target_value__
+
+        LeverAttributes.UnselectAll
+        __DICT__
+        __reinforcement_lever_variables__
+        LeverAttributes.List.Key
+        LeverAttributes.Used
+        __END_DICT__
+
+        // Build reinforced predictor
+        BuildReinforcementClass
+
+        // Output settings
+        ClassFileName __reinforced_predictor_file_path__
+        OK
+        Exit
+        """,
+        # fmt: on
+    ),
+]
diff --git a/khiops/samples/samples.ipynb b/khiops/samples/samples.ipynb
@@ -908,6 +908,50 @@
     "print(f\"The interpretation model is '{interpretor_file_path}'\")"
    ]
   },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### `reinforce_predictor()`\n\n",
+    "Builds a reinforced predictor for an existing predictor\n\n    The reinforced predictor produces the following reinforcement variables for the\n    specified target value to reinforce (i.e. whose probability of occurrence is\n    tentatively increased):\n\n    - initial score, containing the conditional probability of the target value before\n      reinforcement\n    - four variables are output in decreasing reinforcement value: name of the lever\n      variable, reinforcement part, final score after reinforcement, and class change\n      tag.\n\n    It calls `~.api.train_predictor` and `~.api.reinforce_predictor` only with\n    their mandatory parameters.\n    \n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Imports\n",
+    "import os\n",
+    "from khiops import core as kh\n",
+    "\n",
+    "dictionary_file_path = os.path.join(kh.get_samples_dir(), \"Adult\", \"Adult.kdic\")\n",
+    "data_table_path = os.path.join(kh.get_samples_dir(), \"Adult\", \"Adult.txt\")\n",
+    "output_dir = os.path.join(\"kh_samples\", \"reinforce_predictor\")\n",
+    "analysis_report_file_path = os.path.join(output_dir, \"AnalysisResults.khj\")\n",
+    "reinforced_predictor_file_path = os.path.join(output_dir, \"ReinforcedAdultModel.kdic\")\n",
+    "\n",
+    "# Build prediction model\n",
+    "_, predictor_file_path = kh.train_predictor(\n",
+    "    dictionary_file_path,\n",
+    "    \"Adult\",\n",
+    "    data_table_path,\n",
+    "    \"class\",\n",
+    "    analysis_report_file_path,\n",
+    ")\n",
+    "\n",
+    "# Build reinforced predictor\n",
+    "kh.reinforce_predictor(\n",
+    "    predictor_file_path,\n",
+    "    \"SNB_Adult\",\n",
+    "    reinforced_predictor_file_path,\n",
+    "    reinforcement_lever_variables=[\"occupation\"],\n",
+    ")\n",
+    "\n",
+    "print(f\"The reinforced predictor is '{reinforced_predictor_file_path}'\")"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {},
@@ -1454,6 +1498,66 @@
     ")"
    ]
   },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### `deploy_reinforced_model_mt()`\n\n",
+    "Deploys a multi-table reinforced model in the simplest way possible\n\n    It is a call to `~.api.deploy_model` with additional parameters related to\n    the lever variables.\n\n    In this example, a reinforced Selective Naive Bayes (SNB) model is\n    deployed by applying its associated dictionary to the input database.\n    The reinforced model predictions are written to the output data table.\n    \n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Imports\n",
+    "import os\n",
+    "from khiops import core as kh\n",
+    "\n",
+    "# Set the file paths\n",
+    "accidents_dir = os.path.join(kh.get_samples_dir(), \"AccidentsSummary\")\n",
+    "dictionary_file_path = os.path.join(accidents_dir, \"Accidents.kdic\")\n",
+    "accidents_table_path = os.path.join(accidents_dir, \"Accidents.txt\")\n",
+    "vehicles_table_path = os.path.join(accidents_dir, \"Vehicles.txt\")\n",
+    "output_dir = os.path.join(\"kh_samples\", \"deploy_reinforced_model_mt\")\n",
+    "report_file_path = os.path.join(output_dir, \"AnalysisResults.khj\")\n",
+    "reinforced_predictor_file_path = os.path.join(output_dir, \"ReinforcedModel.kdic\")\n",
+    "output_data_table_path = os.path.join(output_dir, \"ReinforcedAccidents.txt\")\n",
+    "\n",
+    "# Train the predictor (see train_predictor_mt for details)\n",
+    "_, model_dictionary_file_path = kh.train_predictor(\n",
+    "    dictionary_file_path,\n",
+    "    \"Accident\",\n",
+    "    accidents_table_path,\n",
+    "    \"Gravity\",\n",
+    "    report_file_path,\n",
+    "    additional_data_tables={\"Vehicles\": vehicles_table_path},\n",
+    "    max_trees=0,\n",
+    ")\n",
+    "\n",
+    "# Reinforce the predictor\n",
+    "kh.reinforce_predictor(\n",
+    "    model_dictionary_file_path,\n",
+    "    \"SNB_Accident\",\n",
+    "    reinforced_predictor_file_path,\n",
+    "    reinforcement_target_value=\"NonLethal\",\n",
+    "    reinforcement_lever_variables=[\"InAgglomeration\", \"CollisionType\"],\n",
+    ")\n",
+    "\n",
+    "# Deploy the reinforced model on the database\n",
+    "# Besides the mandatory parameters, it is specified:\n",
+    "# - A python dictionary linking data paths to file paths for non-root tables\n",
+    "kh.deploy_model(\n",
+    "    reinforced_predictor_file_path,\n",
+    "    \"Reinforcement_SNB_Accident\",\n",
+    "    accidents_table_path,\n",
+    "    output_data_table_path,\n",
+    "    additional_data_tables={\"Vehicles\": vehicles_table_path},\n",
+    ")"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {},
diff --git a/khiops/samples/samples.py b/khiops/samples/samples.py