diff --git a/doc-sources/changelog.rst b/doc-sources/changelog.rst
index 7cf43e09..9de05d67 100644
--- a/doc-sources/changelog.rst
+++ b/doc-sources/changelog.rst
@@ -4,6 +4,23 @@
Changelog
=========
+Version 1.1.0a6 (2024-02-06)
+============================
+
+- **Breaking** Rename ``max_iteration_index`` to ``max_iterations_count`` in ``...TerminateAfterIterations.__init__``
+- Make the Python API guide Jupyter Notebook downloadable
+- Expose all attributes of ``WPB.LearningData``; start to document them in our Python API guide
+- Expose parameters of EvalMaxSAT in our API and command-line interface (see ``lincs learn classification-model --help``):
+
+ - ``--ucncs.max-sat-by-separation.solver`` (for consistency, always ``"eval-max-sat"`` for now)
+ - ``--ucncs.max-sat-by-separation.eval-max-sat.nb-minimize-threads``
+ - ``--ucncs.max-sat-by-separation.eval-max-sat.timeout-fast-minimize``
+ - ``--ucncs.max-sat-by-separation.eval-max-sat.coef-minimize-time``
+ - ``--ucncs.max-sat-by-coalitions.solver`` (for consistency, always ``"eval-max-sat"`` for now)
+ - ``--ucncs.max-sat-by-coalitions.eval-max-sat.nb-minimize-threads``
+ - ``--ucncs.max-sat-by-coalitions.eval-max-sat.timeout-fast-minimize``
+ - ``--ucncs.max-sat-by-coalitions.eval-max-sat.coef-minimize-time``
+
Version 1.1.0a5 (2024-02-01)
============================
diff --git a/doc-sources/conceptual-overview/conceptual-overview.ipynb b/doc-sources/conceptual-overview/conceptual-overview.ipynb
index 1fca336f..d865266d 100644
--- a/doc-sources/conceptual-overview/conceptual-overview.ipynb
+++ b/doc-sources/conceptual-overview/conceptual-overview.ipynb
@@ -21,7 +21,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs classify problem.yml model.yml alternatives.csv\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs classify problem.yml model.yml alternatives.csv\n",
"name,Math,Physics,Literature,History,category\n",
"A,1,1,1,1,\"Full scholarship\"\n",
"B,1,1,1,0,\"Full scholarship\"\n",
diff --git a/doc-sources/get-started.rst b/doc-sources/get-started.rst
index 54e9be05..56f31a55 100644
--- a/doc-sources/get-started.rst
+++ b/doc-sources/get-started.rst
@@ -75,7 +75,7 @@ The generated ``problem.yml`` should look like:
.. code:: yaml
- # Reproduction command (with lincs version 1.1.0a6.dev0): lincs generate classification-problem 4 3 --random-seed 40
+ # Reproduction command (with lincs version 1.1.0a6): lincs generate classification-problem 4 3 --random-seed 40
kind: classification-problem
format_version: 1
criteria:
@@ -146,7 +146,7 @@ It should look like:
.. code:: yaml
- # Reproduction command (with lincs version 1.1.0a6.dev0): lincs generate classification-model problem.yml --random-seed 41 --model-type mrsort
+ # Reproduction command (with lincs version 1.1.0a6): lincs generate classification-model problem.yml --random-seed 41 --model-type mrsort
kind: ncs-classification-model
format_version: 1
accepted_values:
@@ -219,7 +219,7 @@ It should start with something like this, and contain 1000 alternatives:
.. code:: text
- # Reproduction command (with lincs version 1.1.0a6.dev0): lincs generate classified-alternatives problem.yml model.yml 1000 --random-seed 42 --misclassified-count 0
+ # Reproduction command (with lincs version 1.1.0a6): lincs generate classified-alternatives problem.yml model.yml 1000 --random-seed 42 --misclassified-count 0
name,"Criterion 1","Criterion 2","Criterion 3","Criterion 4",category
"Alternative 1",0.37454012,0.796543002,0.95071429,0.183434784,"Best category"
"Alternative 2",0.731993914,0.779690981,0.598658502,0.596850157,"Intermediate category 1"
@@ -255,7 +255,7 @@ so it is numerically different:
.. code:: yaml
- # Reproduction command (with lincs version 1.1.0a6.dev0): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 43 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver glop --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor cpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0
+ # Reproduction command (with lincs version 1.1.0a6): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 43 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver glop --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor cpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0
kind: ncs-classification-model
format_version: 1
accepted_values:
diff --git a/doc-sources/get-started/get-started.ipynb b/doc-sources/get-started/get-started.ipynb
index 52e50d4c..3f4f32b9 100644
--- a/doc-sources/get-started/get-started.ipynb
+++ b/doc-sources/get-started/get-started.ipynb
@@ -48,7 +48,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs generate classification-problem 4 3 --random-seed 40\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs generate classification-problem 4 3 --random-seed 40\n",
"kind: classification-problem\n",
"format_version: 1\n",
"criteria:\n",
@@ -126,7 +126,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs generate classification-model problem.yml --random-seed 41 --model-type mrsort\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs generate classification-model problem.yml --random-seed 41 --model-type mrsort\n",
"kind: ncs-classification-model\n",
"format_version: 1\n",
"accepted_values:\n",
@@ -211,7 +211,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs generate classified-alternatives problem.yml model.yml 1000 --random-seed 42 --misclassified-count 0\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs generate classified-alternatives problem.yml model.yml 1000 --random-seed 42 --misclassified-count 0\n",
"name,\"Criterion 1\",\"Criterion 2\",\"Criterion 3\",\"Criterion 4\",category\n",
"\"Alternative 1\",0.37454012,0.796543002,0.95071429,0.183434784,\"Best category\"\n",
"\"Alternative 2\",0.731993914,0.779690981,0.598658502,0.596850157,\"Intermediate category 1\"\n",
@@ -260,7 +260,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 43 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver glop --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor cpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 43 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver glop --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor cpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0\n",
"kind: ncs-classification-model\n",
"format_version: 1\n",
"accepted_values:\n",
diff --git a/doc-sources/user-guide.rst b/doc-sources/user-guide.rst
index 3ffd5e50..c044281f 100644
--- a/doc-sources/user-guide.rst
+++ b/doc-sources/user-guide.rst
@@ -512,7 +512,7 @@ They produce a different kind of model, with the sufficient coalitions specified
.. code:: yaml
- # Reproduction command (with lincs version 1.1.0a6.dev0): lincs learn classification-model problem.yml learning-set.csv --model-type ucncs --ucncs.strategy sat-by-coalitions
+ # Reproduction command (with lincs version 1.1.0a6): lincs learn classification-model problem.yml learning-set.csv --model-type ucncs --ucncs.strategy sat-by-coalitions
kind: ncs-classification-model
format_version: 1
accepted_values:
diff --git a/doc-sources/user-guide/alglib-learning/alglib-learning.ipynb b/doc-sources/user-guide/alglib-learning/alglib-learning.ipynb
index 6b561860..313bfc7a 100644
--- a/doc-sources/user-guide/alglib-learning/alglib-learning.ipynb
+++ b/doc-sources/user-guide/alglib-learning/alglib-learning.ipynb
@@ -27,7 +27,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 43 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver alglib --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor cpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 43 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver alglib --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor cpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0\n",
"kind: ncs-classification-model\n",
"format_version: 1\n",
"accepted_values:\n",
diff --git a/doc-sources/user-guide/gpu-learning/gpu-learning.ipynb b/doc-sources/user-guide/gpu-learning/gpu-learning.ipynb
index 97977930..c9c6c1cc 100644
--- a/doc-sources/user-guide/gpu-learning/gpu-learning.ipynb
+++ b/doc-sources/user-guide/gpu-learning/gpu-learning.ipynb
@@ -27,7 +27,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 43 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver glop --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor gpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 43 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver glop --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor gpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0\n",
"kind: ncs-classification-model\n",
"format_version: 1\n",
"accepted_values:\n",
diff --git a/doc-sources/user-guide/sat-learning/sat-learning.ipynb b/doc-sources/user-guide/sat-learning/sat-learning.ipynb
index a0879a35..a3851b2c 100644
--- a/doc-sources/user-guide/sat-learning/sat-learning.ipynb
+++ b/doc-sources/user-guide/sat-learning/sat-learning.ipynb
@@ -22,7 +22,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs learn classification-model problem.yml learning-set.csv --model-type ucncs --ucncs.strategy sat-by-coalitions\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs learn classification-model problem.yml learning-set.csv --model-type ucncs --ucncs.strategy sat-by-coalitions\n",
"kind: ncs-classification-model\n",
"format_version: 1\n",
"accepted_values:\n",
@@ -58,7 +58,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs learn classification-model problem.yml learning-set.csv --model-type ucncs --ucncs.strategy max-sat-by-separation --ucncs.max-sat-by-separation.solver eval-max-sat --ucncs.max-sat-by-separation.eval-max-sat.nb-minimize-threads 0 --ucncs.max-sat-by-separation.eval-max-sat.timeout-fast-minimize 60 --ucncs.max-sat-by-separation.eval-max-sat.coef-minimize-time 2\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs learn classification-model problem.yml learning-set.csv --model-type ucncs --ucncs.strategy max-sat-by-separation --ucncs.max-sat-by-separation.solver eval-max-sat --ucncs.max-sat-by-separation.eval-max-sat.nb-minimize-threads 0 --ucncs.max-sat-by-separation.eval-max-sat.timeout-fast-minimize 60 --ucncs.max-sat-by-separation.eval-max-sat.coef-minimize-time 2\n",
"kind: ncs-classification-model\n",
"format_version: 1\n",
"accepted_values:\n",
diff --git a/doc-sources/user-guide/synthetic-data/synthetic-data.ipynb b/doc-sources/user-guide/synthetic-data/synthetic-data.ipynb
index f8c8631a..61afeb39 100644
--- a/doc-sources/user-guide/synthetic-data/synthetic-data.ipynb
+++ b/doc-sources/user-guide/synthetic-data/synthetic-data.ipynb
@@ -14,7 +14,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs generate classification-problem 4 3 --random-seed 57\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs generate classification-problem 4 3 --random-seed 57\n",
"kind: classification-problem\n",
"format_version: 1\n",
"criteria:\n",
@@ -63,7 +63,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs generate classification-model problem.yml --random-seed 58 --model-type mrsort\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs generate classification-model problem.yml --random-seed 58 --model-type mrsort\n",
"kind: ncs-classification-model\n",
"format_version: 1\n",
"accepted_values:\n",
@@ -101,7 +101,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs generate classified-alternatives problem.yml model.yml 100 --random-seed 59 --misclassified-count 0\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs generate classified-alternatives problem.yml model.yml 100 --random-seed 59 --misclassified-count 0\n",
"name,\"Criterion 1\",\"Criterion 2\",\"Criterion 3\",\"Criterion 4\",category\n",
"\"Alternative 1\",0.924035132,0.804616809,0.157870576,0.637420833,\"Best category\"\n",
"\"Alternative 2\",0.866915047,0.979161799,0.0841569453,0.397855282,\"Best category\"\n",
@@ -224,7 +224,7 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "# Reproduction command (with lincs version 1.1.0a6.dev0): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 60 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver glop --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor cpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0\n",
+ "# Reproduction command (with lincs version 1.1.0a6): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 60 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver glop --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor cpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0\n",
"kind: ncs-classification-model\n",
"format_version: 1\n",
"accepted_values:\n",
diff --git a/docs/.buildinfo b/docs/.buildinfo
index 0f7fa6c9..46c17ba1 100644
--- a/docs/.buildinfo
+++ b/docs/.buildinfo
@@ -1,4 +1,4 @@
# Sphinx build info version 1
# This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done.
-config: c3efb7cd4e9892bca8f9a10959dff7ff
+config: bf6a2a9ac0817ff6464d100acb2befb2
tags: 645f666f9bcd5a90fca523b33c5a78b7
diff --git a/docs/.doctrees/changelog.doctree b/docs/.doctrees/changelog.doctree
index 139dfba3..34869da9 100644
Binary files a/docs/.doctrees/changelog.doctree and b/docs/.doctrees/changelog.doctree differ
diff --git a/docs/.doctrees/environment.pickle b/docs/.doctrees/environment.pickle
index dac910f4..73ffd531 100644
Binary files a/docs/.doctrees/environment.pickle and b/docs/.doctrees/environment.pickle differ
diff --git a/docs/.doctrees/get-started.doctree b/docs/.doctrees/get-started.doctree
index d6d01506..85d982e5 100644
Binary files a/docs/.doctrees/get-started.doctree and b/docs/.doctrees/get-started.doctree differ
diff --git a/docs/.doctrees/python-api.doctree b/docs/.doctrees/python-api.doctree
index ebd84073..539e9c69 100644
Binary files a/docs/.doctrees/python-api.doctree and b/docs/.doctrees/python-api.doctree differ
diff --git a/docs/.doctrees/reference.doctree b/docs/.doctrees/reference.doctree
index a68b3e02..f1884d44 100644
Binary files a/docs/.doctrees/reference.doctree and b/docs/.doctrees/reference.doctree differ
diff --git a/docs/.doctrees/reference/lincs.doctree b/docs/.doctrees/reference/lincs.doctree
index 4f1ef614..843d41e0 100644
Binary files a/docs/.doctrees/reference/lincs.doctree and b/docs/.doctrees/reference/lincs.doctree differ
diff --git a/docs/.doctrees/user-guide.doctree b/docs/.doctrees/user-guide.doctree
index cb134dcf..4527df3d 100644
Binary files a/docs/.doctrees/user-guide.doctree and b/docs/.doctrees/user-guide.doctree differ
diff --git a/docs/README.html b/docs/README.html
index baf45229..323625cb 100644
--- a/docs/README.html
+++ b/docs/README.html
@@ -5,11 +5,11 @@
-
Contributors — lincs 1.1.0a5 documentation
+ Contributors — lincs 1.1.0a6 documentation
-
+
diff --git a/docs/_downloads/019271a03d05a599bcfb6d68c868c86a/python-api.ipynb b/docs/_downloads/019271a03d05a599bcfb6d68c868c86a/python-api.ipynb
new file mode 100644
index 00000000..81a889b6
--- /dev/null
+++ b/docs/_downloads/019271a03d05a599bcfb6d68c868c86a/python-api.ipynb
@@ -0,0 +1,2264 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "id": "03918549-cc28-44e3-9d3c-627c2a4e1683",
+ "metadata": {},
+ "source": [
+ "# The Python API"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "ef1a1243-f769-4cf1-9016-960e656e2e3e",
+ "metadata": {},
+ "source": [
+ "This document builds upon [our \"Get Started\" guide](https://mics-lab.github.io/lincs/get-started.html) and our [user guide](https://mics-lab.github.io/lincs/user-guide.html), and introduces *lincs*' Python API.\n",
+ "This API is more flexible, albeit more complex, than the command-line interface you've been using so far.\n",
+ "\n",
+ "If you're a Jupyter user, you can [download the notebook](python-api/python-api.ipynb) this document is based on."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "110a27c5-0f21-4c03-84d7-1947a86bb8fd",
+ "metadata": {},
+ "source": [
+ "## Do it again, in Python"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "a567f03d-64aa-4cbb-9ec5-d12a6ab4bec7",
+ "metadata": {},
+ "source": [
+ "First, let's do exactly the same thing as in our \"Get started\" guide, but using the Python API."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "77963196-9956-460c-989f-e7772f800a01",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from lincs import classification as lc"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "d85a8506-401f-4a3d-893c-996b11e99fe2",
+ "metadata": {},
+ "source": [
+ "Generate a synthetic classification problem:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "08948c5a-22e5-498a-96a7-9826d47e2f5d",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "problem = lc.generate_problem(criteria_count=4, categories_count=3, random_seed=40)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "0a9103e8-8884-4606-88ca-ed41b2b0972f",
+ "metadata": {},
+ "source": [
+ "The first difference with the command-line interface is the third argument to the call to `generate_problem`: it's the pseudo-random seed optionally passed by the `--random-seed` option on the command line. All pseudo-random seeds are mandatory in the Python API, so that you have full control of reproducibility. If you don't care about it, you can use `random.randrange(2**30)` to use pseudo-random pseudo-random seeds. (No typo here: the pseudo-random seeds are pseudo-random.)\n",
+ "\n",
+ "Generated problems are returned as Python objects of class `lincs.Problem`. You can print them:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "id": "65d792e1-0720-45d8-b756-fe74537865b0",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "kind: classification-problem\n",
+ "format_version: 1\n",
+ "criteria:\n",
+ " - name: Criterion 1\n",
+ " value_type: real\n",
+ " preference_direction: increasing\n",
+ " min_value: 0\n",
+ " max_value: 1\n",
+ " - name: Criterion 2\n",
+ " value_type: real\n",
+ " preference_direction: increasing\n",
+ " min_value: 0\n",
+ " max_value: 1\n",
+ " - name: Criterion 3\n",
+ " value_type: real\n",
+ " preference_direction: increasing\n",
+ " min_value: 0\n",
+ " max_value: 1\n",
+ " - name: Criterion 4\n",
+ " value_type: real\n",
+ " preference_direction: increasing\n",
+ " min_value: 0\n",
+ " max_value: 1\n",
+ "ordered_categories:\n",
+ " - name: Worst category\n",
+ " - name: Intermediate category 1\n",
+ " - name: Best category\n"
+ ]
+ }
+ ],
+ "source": [
+ "import sys\n",
+ "problem.dump(sys.stdout)"
+ ]
+ },
+ {
+ "attachments": {},
+ "cell_type": "markdown",
+ "id": "6875cdf0-9e37-4733-9b1d-11b474a09380",
+ "metadata": {},
+ "source": [
+ "Description functions generate a list of strings:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "4e37c394-a2e5-46ec-8813-5475f0a5c6f3",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "This a classification problem into 3 ordered categories named \"Worst category\", \"Intermediate category 1\" and \"Best category\".\n",
+ "The best category is \"Best category\" and the worst category is \"Worst category\".\n",
+ "There are 4 classification criteria (in no particular order).\n",
+ "Criterion \"Criterion 1\" takes real values between 0.0 and 1.0 included.\n",
+ "Higher values of \"Criterion 1\" are known to be better.\n",
+ "Criterion \"Criterion 2\" takes real values between 0.0 and 1.0 included.\n",
+ "Higher values of \"Criterion 2\" are known to be better.\n",
+ "Criterion \"Criterion 3\" takes real values between 0.0 and 1.0 included.\n",
+ "Higher values of \"Criterion 3\" are known to be better.\n",
+ "Criterion \"Criterion 4\" takes real values between 0.0 and 1.0 included.\n",
+ "Higher values of \"Criterion 4\" are known to be better.\n"
+ ]
+ }
+ ],
+ "source": [
+ "print(\"\\n\".join(lc.describe_problem(problem)))"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "5b170efd-eef5-4d4b-b435-b3c246a5fda6",
+ "metadata": {},
+ "source": [
+ "Generate a synthetic MR-Sort classification model, again with an explicit pseudo-random seed:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "id": "ba5ba906-1457-4544-a754-fa33f30c19d5",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "kind: ncs-classification-model\n",
+ "format_version: 1\n",
+ "accepted_values:\n",
+ " - kind: thresholds\n",
+ " thresholds: [0.255905151, 0.676961303]\n",
+ " - kind: thresholds\n",
+ " thresholds: [0.0551739037, 0.324553937]\n",
+ " - kind: thresholds\n",
+ " thresholds: [0.162252158, 0.673279881]\n",
+ " - kind: thresholds\n",
+ " thresholds: [0.0526000932, 0.598555863]\n",
+ "sufficient_coalitions:\n",
+ " - &coalitions\n",
+ " kind: weights\n",
+ " criterion_weights: [0.147771254, 0.618687689, 0.406786472, 0.0960085914]\n",
+ " - *coalitions\n"
+ ]
+ }
+ ],
+ "source": [
+ "model = lc.generate_mrsort_model(problem, random_seed=41)\n",
+ "\n",
+ "model.dump(problem, sys.stdout)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "b836036d-1da3-427b-8c78-c9b457fca7a9",
+ "metadata": {},
+ "source": [
+ "Visualization functions interface with [Matplotlib](https://matplotlib.org/):"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "id": "4ef64c1f-1f27-4864-b527-a21b0b8b9596",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import matplotlib.pyplot as plt"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 7,
+ "id": "3c2c0bb7-e738-4cd9-83cf-bd60e4774d58",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "image/png": "",
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "axes = plt.subplots(1, 1, figsize=(6, 4), layout=\"constrained\")[1]\n",
+ "lc.visualize_model(problem, model, [], axes)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "3bee34aa-beec-41ba-813a-3cd582aee9b0",
+ "metadata": {},
+ "source": [
+ "Get the model's description:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "id": "d2eadcf7-4565-45fe-bbc3-9e5cd7c9b73b",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "This is a MR-Sort (a.k.a. 1-Uc-NCS) model: an NCS model where the sufficient coalitions are specified using the same criterion weights for all boundaries.\n",
+ "The weights associated to each criterion are:\n",
+ " - Criterion \"Criterion 1\": 0.15\n",
+ " - Criterion \"Criterion 2\": 0.62\n",
+ " - Criterion \"Criterion 3\": 0.41\n",
+ " - Criterion \"Criterion 4\": 0.10\n",
+ "To get into an upper category, an alternative must be better than the following profiles on a set of criteria whose weights add up to at least 1:\n",
+ " - For category \"Intermediate category 1\": at least 0.26 on criterion \"Criterion 1\", at least 0.06 on criterion \"Criterion 2\", at least 0.16 on criterion \"Criterion 3\", and at least 0.05 on criterion \"Criterion 4\"\n",
+ " - For category \"Best category\": at least 0.68 on criterion \"Criterion 1\", at least 0.32 on criterion \"Criterion 2\", at least 0.67 on criterion \"Criterion 3\", and at least 0.60 on criterion \"Criterion 4\"\n"
+ ]
+ }
+ ],
+ "source": [
+ "print(\"\\n\".join(lc.describe_model(problem, model)))"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "00fab94b-22a7-41ae-8dfa-48263d3d8dfe",
+ "metadata": {},
+ "source": [
+ "Generate a synthetic learning set (with an explicit pseudo-random seed):"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "id": "dac523f0-1340-4465-b487-7eca3bcd7c64",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "learning_set = lc.generate_alternatives(problem, model, alternatives_count=1000, random_seed=42)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "76b3a98d-e69c-4164-8ba0-557ff039bef9",
+ "metadata": {},
+ "source": [
+ "Dump it (in memory instead of on `sys.stdout` to print only the first few lines):"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 10,
+ "id": "0d3fc508-480b-40dc-b7c9-1f7eb5637d8c",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "name,\"Criterion 1\",\"Criterion 2\",\"Criterion 3\",\"Criterion 4\",category\n",
+ "\"Alternative 1\",0.37454012,0.796543002,0.95071429,0.183434784,\"Best category\"\n",
+ "\"Alternative 2\",0.731993914,0.779690981,0.598658502,0.596850157,\"Intermediate category 1\"\n",
+ "\"Alternative 3\",0.156018645,0.445832759,0.15599452,0.0999749228,\"Worst category\"\n",
+ "\"Alternative 4\",0.0580836125,0.4592489,0.866176128,0.333708614,\"Best category\"\n",
+ "\"Alternative 5\",0.601114988,0.14286682,0.708072603,0.650888503,\"Intermediate category 1\"\n",
+ "...\n"
+ ]
+ }
+ ],
+ "source": [
+ "import io\n",
+ "f = io.StringIO()\n",
+ "learning_set.dump(problem, f)\n",
+ "print(\"\\n\".join(f.getvalue().splitlines()[:6] + ['...']))"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "6e864665-f7b1-454e-ae4e-8b397e211266",
+ "metadata": {},
+ "source": [
+ "Visualize it:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 11,
+ "id": "3c2d9304-eeb3-4b56-8dcf-368e46117048",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "image/png": "",
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "axes = plt.subplots(1, 1, figsize=(6, 4), layout=\"constrained\")[1]\n",
+ "lc.visualize_model(problem, model, learning_set.alternatives[:5], axes)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "b625f1a5-ef14-4533-912c-cc281e269641",
+ "metadata": {},
+ "source": [
+ "Let's now train a new model from this synthetic learning set.\n",
+ "The command-line interface of `lincs learn classification-model` accepts quite a few options.\n",
+ "Most of them set up the strategies used for the learning, as described further in our [user guide](https://mics-lab.github.io/lincs/user-guide.html).\n",
+ "When using the Python API, you have to create these strategies yourself:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "id": "c552db53-b77d-4011-9298-6e2504e4093c",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "learning_data = lc.LearnMrsortByWeightsProfilesBreed.LearningData(problem, learning_set, models_count=9, random_seed=43)\n",
+ "profiles_initialization_strategy = lc.InitializeProfilesForProbabilisticMaximalDiscriminationPowerPerCriterion(learning_data)\n",
+ "weights_optimization_strategy = lc.OptimizeWeightsUsingGlop(learning_data)\n",
+ "profiles_improvement_strategy = lc.ImproveProfilesWithAccuracyHeuristicOnCpu(learning_data)\n",
+ "breeding_strategy = lc.ReinitializeLeastAccurate(learning_data, profiles_initialization_strategy=profiles_initialization_strategy, count=4)\n",
+ "termination_strategy = lc.TerminateAtAccuracy(learning_data, target_accuracy=len(learning_set.alternatives))"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "e9eb59f7-3c47-429f-857a-2c88b1d2deb6",
+ "metadata": {},
+ "source": [
+ "Then create the learning itself:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 13,
+ "id": "df2de7ed-4a91-4dc9-b5b2-598a277c9a5a",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "learning = lc.LearnMrsortByWeightsProfilesBreed(\n",
+ " learning_data,\n",
+ " profiles_initialization_strategy,\n",
+ " weights_optimization_strategy,\n",
+ " profiles_improvement_strategy,\n",
+ " breeding_strategy,\n",
+ " termination_strategy,\n",
+ ")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "8848f232-beda-41d0-9ba7-0889f15e6216",
+ "metadata": {},
+ "source": [
+ "And `.perform` it to create the learned `Model` object:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 14,
+ "id": "4f752442-f9ee-43ce-bd51-341b6e6a5081",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "kind: ncs-classification-model\n",
+ "format_version: 1\n",
+ "accepted_values:\n",
+ " - kind: thresholds\n",
+ " thresholds: [0.339874953, 0.421424538]\n",
+ " - kind: thresholds\n",
+ " thresholds: [0.0556534864, 0.326433569]\n",
+ " - kind: thresholds\n",
+ " thresholds: [0.162616938, 0.67343241]\n",
+ " - kind: thresholds\n",
+ " thresholds: [0.0878681168, 0.252649099]\n",
+ "sufficient_coalitions:\n",
+ " - &coalitions\n",
+ " kind: weights\n",
+ " criterion_weights: [0, 1.01327896e-06, 0.999998987, 0]\n",
+ " - *coalitions\n"
+ ]
+ }
+ ],
+ "source": [
+ "learned_model = learning.perform()\n",
+ "learned_model.dump(problem, sys.stdout)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "a6f694fa-f820-4869-bde6-d46ff90cf9b6",
+ "metadata": {},
+ "source": [
+ "Create a testing set and classify it, taking note of the accuracy of the new model on that testing set:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 15,
+ "id": "1fdb4fa6-f54e-4981-832c-f0175fc1c54b",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(4, 2996)"
+ ]
+ },
+ "execution_count": 15,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "testing_set = lc.generate_alternatives(problem, model, alternatives_count=3000, random_seed=44)\n",
+ "classification_result = lc.classify_alternatives(problem, learned_model, testing_set)\n",
+ "classification_result.changed, classification_result.unchanged"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "44f38224-0b66-42c3-becb-7b44e3924305",
+ "metadata": {},
+ "source": [
+ "This covers what was done in our \"Get started\" guide.\n",
+ "As you can see, the Python API is more verbose, but for good reason: it's more powerful, as you'll see in the next section."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "e04a3a27-824d-41c6-9d0f-3ded09b205a8",
+ "metadata": {},
+ "source": [
+ "## Do more, with the Python API"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "3dd98560-201c-4634-9e9c-2c54d73ca0a8",
+ "metadata": {},
+ "source": [
+ "### Create classification objects"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "8f4aa99e-35a7-449c-bd00-4bea102390fa",
+ "metadata": {},
+ "source": [
+ "You don't have to use our pseudo-random generation functions; you can create `Problem`, `Model`, *etc.* instances yourself."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "4e95efaf-8714-4868-b7e1-aaecf4c21885",
+ "metadata": {},
+ "source": [
+ "#### Create a `Problem`"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 16,
+ "id": "ed9ed7fd-6dcd-4b0f-95de-5118a266056d",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "kind: classification-problem\n",
+ "format_version: 1\n",
+ "criteria:\n",
+ " - name: Physics grade\n",
+ " value_type: integer\n",
+ " preference_direction: increasing\n",
+ " min_value: 0\n",
+ " max_value: 100\n",
+ " - name: Literature grade\n",
+ " value_type: enumerated\n",
+ " ordered_values: [f, e, d, c, b, a]\n",
+ "ordered_categories:\n",
+ " - name: Failed\n",
+ " - name: Passed\n",
+ " - name: Congratulations\n"
+ ]
+ }
+ ],
+ "source": [
+ "problem = lc.Problem(\n",
+ " criteria=[\n",
+ " lc.Criterion(\"Physics grade\", lc.Criterion.IntegerValues(lc.Criterion.PreferenceDirection.increasing, 0, 100)),\n",
+ " lc.Criterion(\"Literature grade\", lc.Criterion.EnumeratedValues([\"f\", \"e\", \"d\", \"c\", \"b\", \"a\"])),\n",
+ " ],\n",
+ " ordered_categories=[lc.Category(\"Failed\"), lc.Category(\"Passed\"), lc.Category(\"Congratulations\")],\n",
+ ")\n",
+ "\n",
+ "problem.dump(sys.stdout)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "60d24fd0-67ef-42ec-b76a-fa5729658e4d",
+ "metadata": {},
+ "source": [
+ "You can access all their attributes in code as well:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 17,
+ "id": "a0dc62c9-9f5a-4ffb-98aa-cae20a56492e",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "criterion = problem.criteria[0]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 18,
+ "id": "0ae00d4a-4890-436b-8e81-b0f113e37f9b",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "'Physics grade'"
+ ]
+ },
+ "execution_count": 18,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "criterion.name"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 19,
+ "id": "6f7e7b92-d111-47aa-bd3d-02837b1392e0",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(liblincs.ValueType.integer, False, True, False)"
+ ]
+ },
+ "execution_count": 19,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "criterion.value_type, criterion.is_real, criterion.is_integer, criterion.is_enumerated"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 20,
+ "id": "35d2c1c0-9836-479c-a440-2f68ab35d050",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "values = criterion.integer_values"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 21,
+ "id": "fb85c12f-5cb3-49cc-9778-c7f702cbc11a",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(liblincs.PreferenceDirection.isotone, True, False)"
+ ]
+ },
+ "execution_count": 21,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "values.preference_direction, values.is_increasing, values.is_decreasing"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 22,
+ "id": "9c39cda6-5fa8-41c9-83fb-324148628d09",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(0, 100)"
+ ]
+ },
+ "execution_count": 22,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "values.min_value, values.max_value"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 23,
+ "id": "706551fd-25aa-4cfd-8778-a556ce99fc36",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "criterion = problem.criteria[1]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 24,
+ "id": "13843008-4dcc-4da7-8a4d-73a3b449a8f1",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "'Literature grade'"
+ ]
+ },
+ "execution_count": 24,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "criterion.name"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 25,
+ "id": "2b3f21b9-39d8-41ef-bfaa-76106f31834b",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(liblincs.ValueType.enumerated, False, False, True)"
+ ]
+ },
+ "execution_count": 25,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "criterion.value_type, criterion.is_real, criterion.is_integer, criterion.is_enumerated"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 26,
+ "id": "17b53592-8a71-4286-91da-0c92b941ad93",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "values = criterion.enumerated_values"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 27,
+ "id": "c71ea01f-0f6d-4a55-b462-9fafbf1013fa",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "['f', 'e', 'd', 'c', 'b', 'a']"
+ ]
+ },
+ "execution_count": 27,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "list(values.ordered_values)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 28,
+ "id": "3d2c5f72-04c4-4a2e-8df0-23551beef9f1",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "5"
+ ]
+ },
+ "execution_count": 28,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "values.get_value_rank(value=\"a\")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "e74adcad-1a37-4628-8435-077c7587c9dd",
+ "metadata": {},
+ "source": [
+ "#### Create a `Model`"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 29,
+ "id": "8142b595-1213-42ad-bfbe-c38f5f9113d7",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "kind: ncs-classification-model\n",
+ "format_version: 1\n",
+ "accepted_values:\n",
+ " - kind: thresholds\n",
+ " thresholds: [50, 80]\n",
+ " - kind: thresholds\n",
+ " thresholds: [c, a]\n",
+ "sufficient_coalitions:\n",
+ " - &coalitions\n",
+ " kind: weights\n",
+ " criterion_weights: [0.5, 0.5]\n",
+ " - *coalitions\n"
+ ]
+ }
+ ],
+ "source": [
+ "model = lc.Model(\n",
+ " problem,\n",
+ " accepted_values=[\n",
+ " lc.AcceptedValues(lc.AcceptedValues.IntegerThresholds([50, 80])),\n",
+ " lc.AcceptedValues(lc.AcceptedValues.EnumeratedThresholds([\"c\", \"a\"])),\n",
+ " ],\n",
+ " sufficient_coalitions=[\n",
+ " lc.SufficientCoalitions(lc.SufficientCoalitions.Weights([0.5, 0.5])),\n",
+ " lc.SufficientCoalitions(lc.SufficientCoalitions.Weights([0.5, 0.5])),\n",
+ " ],\n",
+ ")\n",
+ "\n",
+ "model.dump(problem, sys.stdout)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 30,
+ "id": "4d9286ed-1fde-42ea-854b-3ef3cd532f82",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "accepted = model.accepted_values[0]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 31,
+ "id": "161f926c-f9e5-4bc7-9382-c069d10458d8",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(liblincs.ValueType.integer, False, True, False)"
+ ]
+ },
+ "execution_count": 31,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "accepted.value_type, accepted.is_real, accepted.is_integer, accepted.is_enumerated"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 32,
+ "id": "c1298109-a0e9-4660-bd49-c325c0222d72",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(liblincs.Kind.thresholds, True)"
+ ]
+ },
+ "execution_count": 32,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "accepted.kind, accepted.is_thresholds"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 33,
+ "id": "767b2049-aad2-45a1-9bfc-1e3f7273be46",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[50, 80]"
+ ]
+ },
+ "execution_count": 33,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "list(accepted.integer_thresholds.thresholds)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 34,
+ "id": "36256e92-7b2a-4131-b088-35f52dae6dd3",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "accepted = model.accepted_values[1]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 35,
+ "id": "62c1aa27-cbc8-4032-9282-e1acf76ffa01",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(liblincs.ValueType.enumerated, False, False, True)"
+ ]
+ },
+ "execution_count": 35,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "accepted.value_type, accepted.is_real, accepted.is_integer, accepted.is_enumerated"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 36,
+ "id": "ffc03b33-b0cc-4211-b8f3-d0dbedc8131a",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(liblincs.Kind.thresholds, True)"
+ ]
+ },
+ "execution_count": 36,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "accepted.kind, accepted.is_thresholds"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 37,
+ "id": "26a4d2eb-5d2b-42a3-8348-da1d16b5303f",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "['c', 'a']"
+ ]
+ },
+ "execution_count": 37,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "list(accepted.enumerated_thresholds.thresholds)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 38,
+ "id": "4690357c-2082-420e-b294-0010ef46f662",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "sufficient = model.sufficient_coalitions[0]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 39,
+ "id": "bc0e16b6-ac03-4f81-9c03-79f6c6c91a8b",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(liblincs.Kind.weights, True, False)"
+ ]
+ },
+ "execution_count": 39,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "sufficient.kind, sufficient.is_weights, sufficient.is_roots"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 40,
+ "id": "6fb81ac9-3f62-4f90-874f-de827d8d761a",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[0.5, 0.5]"
+ ]
+ },
+ "execution_count": 40,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "list(sufficient.weights.criterion_weights)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "34adef06-2a98-4278-976f-0bfbcdae399b",
+ "metadata": {},
+ "source": [
+ "#### Create (classified) `Alternatives`"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 41,
+ "id": "44429b29-e039-46ab-b5ad-e2939a729406",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "alternatives = lc.Alternatives(problem, [\n",
+ " lc.Alternative(\n",
+ " \"Unclassified alternative\",\n",
+ " [\n",
+ " lc.Performance(lc.Performance.Integer(50)),\n",
+ " lc.Performance(lc.Performance.Enumerated(\"c\")),\n",
+ " ],\n",
+ " None\n",
+ " ),\n",
+ " lc.Alternative(\n",
+ " \"Classified alternative\",\n",
+ " [\n",
+ " lc.Performance(lc.Performance.Integer(90)),\n",
+ " lc.Performance(lc.Performance.Enumerated(\"a\")),\n",
+ " ],\n",
+ " 2\n",
+ " ),\n",
+ "])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 42,
+ "id": "55a42ccb-27e8-46ea-89c5-3b2828cb34e8",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "alternative = alternatives.alternatives[0]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 43,
+ "id": "2dfdf211-2120-4098-a84b-c3b71ac7b8c7",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "True"
+ ]
+ },
+ "execution_count": 43,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "alternative.category_index is None"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 44,
+ "id": "3ddd8143-0374-4e5d-9d97-8673907062cd",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "performance = alternative.profile[0]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 45,
+ "id": "168d930a-f8e9-4777-b489-7e3214b2fc54",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(liblincs.ValueType.integer, False, True, False)"
+ ]
+ },
+ "execution_count": 45,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "performance.value_type, performance.is_real, performance.is_integer, performance.is_enumerated"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 46,
+ "id": "77e19ca9-1fa5-4a4c-99b9-18be4b660596",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "50"
+ ]
+ },
+ "execution_count": 46,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "performance.integer.value"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 47,
+ "id": "95ee2b32-0210-4b77-a0b6-66812bcb1e45",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "'Congratulations'"
+ ]
+ },
+ "execution_count": 47,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "problem.ordered_categories[alternatives.alternatives[1].category_index].name"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "14c1121f-8cfc-4df8-ae73-1574970a382f",
+ "metadata": {},
+ "source": [
+ "### Clone classification objects"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "269d4ce1-75de-4107-b89d-3d86787fa6aa",
+ "metadata": {},
+ "source": [
+ "Just use [`copy.deepcopy`](https://docs.python.org/3/library/copy.html#copy.deepcopy):"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 48,
+ "id": "b3927282-a8d3-4f91-959a-9c4d23e5f473",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import copy\n",
+ "\n",
+ "copied_problem = copy.deepcopy(problem)\n",
+ "copied_model = copy.deepcopy(model)\n",
+ "copied_alternatives = copy.deepcopy(alternatives)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "5b97e1f1-00b2-4274-9eb3-145cab40542d",
+ "metadata": {},
+ "source": [
+ "This is especially useful *e.g.* if you want to identify alternatives that are classified differently by two models, because `lc.classify_alternatives` mutates the alternatives: clone the `Alternatives`, classify the copy and iterate over the [`zip`](https://docs.python.org/3/library/functions.html#zip) of both `Alternatives`, comparing their `.category_index`."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "97c52075-e6df-4763-ac72-7ea8e3adebe5",
+ "metadata": {},
+ "source": [
+ "### Serialize classification objects"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "f04191af-4bce-4328-91e8-eb5292d26ebd",
+ "metadata": {},
+ "source": [
+ "#### In YAML and CSV like the command-line\n",
+ "\n",
+ "(and the upcoming C++ API)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "395bbfef-ce1a-4d56-81d5-fa9bcbbbd410",
+ "metadata": {},
+ "source": [
+ "Classification objects have a `.dump` method, and their classes have a static `.load` method; both accept file-like objects.\n",
+ "\n",
+ "We've used them above to print classification objects to `sys.stdout`. Here is an example of how to use them with actual files:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 49,
+ "id": "b76a3046-5e1c-4ad8-9b00-4dc24486a4d9",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "with open(\"problem.yml\", \"w\") as f:\n",
+ " problem.dump(f)\n",
+ "\n",
+ "with open(\"model.yml\", \"w\") as f:\n",
+ " model.dump(problem, f)\n",
+ "\n",
+ "with open(\"alternatives.csv\", \"w\") as f:\n",
+ " alternatives.dump(problem, f)\n",
+ "\n",
+ "with open(\"problem.yml\") as f:\n",
+ " problem = lc.Problem.load(f)\n",
+ "\n",
+ "with open(\"model.yml\") as f:\n",
+ " model = lc.Model.load(problem, f)\n",
+ "\n",
+ "with open(\"alternatives.csv\") as f:\n",
+ " alternatives = lc.Alternatives.load(problem, f)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "87932b00-021c-4389-87ed-690d1f30effb",
+ "metadata": {},
+ "source": [
+ "And here with in-memory [io](https://docs.python.org/3/library/io.html) objects:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 50,
+ "id": "8844542e-b8bf-4a6e-b370-828d6e05c3ab",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "kind: classification-problem\n",
+ "format_version: 1\n",
+ "criteria:\n",
+ " - name: Physics grade\n",
+ " value_type: integer\n",
+ " preference_direction: increasing\n",
+ " min_value: 0\n",
+ " max_value: 100\n",
+ " - name: Literature grade\n",
+ " value_type: enumerated\n",
+ " ordered_values: [f, e, d, c, b, a]\n",
+ "ordered_categories:\n",
+ " - name: Failed\n",
+ " - name: Passed\n",
+ " - name: Congratulations\n",
+ "\n"
+ ]
+ }
+ ],
+ "source": [
+ "f = io.StringIO()\n",
+ "problem.dump(f)\n",
+ "s = f.getvalue()\n",
+ "print(s)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 51,
+ "id": "b5fe484c-7d80-40ea-9098-0b2776833510",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "f = io.StringIO(s)\n",
+ "problem = lc.Problem.load(f)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "784d7f86-0b02-4bd6-a4a9-280232b05fde",
+ "metadata": {},
+ "source": [
+ "#### Using the Python-specific `pickle` module"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "57f2a0dc-608d-4db8-b3b6-ac0b4d198a6d",
+ "metadata": {},
+ "source": [
+ "Classification objects simply support [pickling](https://docs.python.org/3/library/pickle.html) and unpickling. We recommend using the YAML and CSV formats whenever possible because they are not tied to the Python language (or the *lincs* library for that matter)."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 52,
+ "id": "1e1b8f9d-c82d-4525-b094-13a55c445ff0",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "kind: classification-problem\n",
+ "format_version: 1\n",
+ "criteria:\n",
+ " - name: Physics grade\n",
+ " value_type: integer\n",
+ " preference_direction: increasing\n",
+ " min_value: 0\n",
+ " max_value: 100\n",
+ " - name: Literature grade\n",
+ " value_type: enumerated\n",
+ " ordered_values: [f, e, d, c, b, a]\n",
+ "ordered_categories:\n",
+ " - name: Failed\n",
+ " - name: Passed\n",
+ " - name: Congratulations\n"
+ ]
+ }
+ ],
+ "source": [
+ "import pickle\n",
+ "\n",
+ "pickle.loads(pickle.dumps(problem)).dump(sys.stdout)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "eba4a737-e844-44d3-9158-a63a7fdefc3d",
+ "metadata": {},
+ "source": [
+ "Note however that learning objects (*e.g.* instances of `LearnMrsortByWeightsProfilesBreed`) are *not* picklable."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "c33628cc-d611-4ed3-954d-0b7bbc04c698",
+ "metadata": {},
+ "source": [
+ "### Customize the model visualization"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "132da858-692d-46b3-b7ad-f10c6bb744fd",
+ "metadata": {},
+ "source": [
+ "@todo(Documentation, v1.1) Write this section. Explain that `visualize_model` is written in terms of the public Python API and can be used as a base (*i.e.* copy-pasted)."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "e8556878-23a0-45d2-964f-f82f1a217b1d",
+ "metadata": {},
+ "source": [
+ "### Create your own learning strategies"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "e5326968-1069-4c3f-b1a1-8823c7956e3b",
+ "metadata": {},
+ "source": [
+ "@todo(Documentation, v1.1) Introduce this section."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 53,
+ "id": "de3701e6-784a-4fb8-84cf-aa65ecc26d71",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "problem = lc.Problem(\n",
+ " [\n",
+ " lc.Criterion(\"Criterion 1\", lc.Criterion.RealValues(lc.Criterion.PreferenceDirection.decreasing, 0, 10)),\n",
+ " lc.Criterion(\"Criterion 2\", lc.Criterion.IntegerValues(lc.Criterion.PreferenceDirection.increasing, 0, 100)),\n",
+ " lc.Criterion(\"Criterion 3\", lc.Criterion.EnumeratedValues([\"F\", \"E\", \"D\", \"C\", \"B\", \"A\"])),\n",
+ " ],\n",
+ " [lc.Category(\"Bad\"), lc.Category(\"Medium\"), lc.Category(\"Good\")],\n",
+ ")\n",
+ "model = lc.generate_mrsort_model(problem, random_seed=42)\n",
+ "learning_set = lc.generate_alternatives(problem, model, alternatives_count=1000, random_seed=43)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "89022cc0-86d2-41ae-9492-60ce1623425f",
+ "metadata": {},
+ "source": [
+ "#### `LearningData`"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "6b3b861f-f16a-4574-9956-c6087482e302",
+ "metadata": {},
+ "source": [
+ "First, let's get more familiar with the `LearningData`:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 54,
+ "id": "dec0c847-98ac-42f2-a2ee-1fd0a4c9ac0e",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "learning_data = lc.LearnMrsortByWeightsProfilesBreed.LearningData(problem, learning_set, models_count=9, random_seed=43)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "dc4244fd-f862-4ba9-8d6f-6e669c273530",
+ "metadata": {},
+ "source": [
+ "It contains two families of attributes."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "d611a8bc-b4d7-4003-8d4d-f1d7835d3a4f",
+ "metadata": {},
+ "source": [
+ "##### Input data"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "6e40ad12-e93b-40a9-96a9-3b3e7c717152",
+ "metadata": {},
+ "source": [
+ "The first one is about the problem and learning set. These attributes never change. First, the counts:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 55,
+ "id": "5e6d7c88-af1e-474f-b631-8ff6d84ab60e",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(3, 3, 2, 1000)"
+ ]
+ },
+ "execution_count": 55,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "(learning_data.criteria_count, learning_data.categories_count, learning_data.boundaries_count, learning_data.alternatives_count)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "a718bf27-98dc-4d60-a824-7baac5f607cb",
+ "metadata": {},
+ "source": [
+ "The learning set is pre-processed in the `LearningData` so that learning algorithms don't have to manipulate the different types of criterion values. In the `LearningData`, we keep only the ranks of the performances of each alternative in the learning set. The learning set is also destructured into a few arrays. Here are the attributes that describe this pre-processed learning set:\n",
+ "\n",
+ "The number of distinct values actually seen for each criterion (including the min and max values for numerical criteria):"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 56,
+ "id": "c2531e9f-a957-4903-9e77-ad7ee513ca63",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[1002, 101, 6]"
+ ]
+ },
+ "execution_count": 56,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "list(learning_data.values_counts) # Indexed by [criterion_index]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 57,
+ "id": "b5f7c642-475b-4986-b0f1-0168fa169476",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(1002, 6)"
+ ]
+ },
+ "execution_count": 57,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "(learning_data.values_counts[0], learning_data.values_counts[learning_data.criteria_count - 1])"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "e0eb4ea9-f857-479e-b1c9-a87c44e151bf",
+ "metadata": {},
+ "source": [
+ "We see that the learning data knows 1002 values for the real-valued criterion. This is expected: two floating-point values are rarely exactly equal, so the 1000 alternatives have distinct values, and the min and max are two more values. The learning data contains 101 values for the integer-valued criterion, meaning that the alternatives in the learning set do actually cover the whole set of possible values. And similarly, 6 values for the enumerated criterion.\n",
+ "\n",
+ "For each criterion, the ranks of the performance of each alternative:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 58,
+ "id": "085a36fa-7c82-43da-aa29-1687b693dcb2",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[[883, 900, 753, 216, 365, 410, 302, 852, 738, 45, '...'],\n",
+ " [50, 13, 17, 86, 4, 2, 25, 81, 47, 87, '...'],\n",
+ " [3, 0, 1, 0, 3, 3, 2, 0, 0, 3, '...']]"
+ ]
+ },
+ "execution_count": 58,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "[list(v)[:10] + ['...'] for v in learning_data.performance_ranks] # Indexed by [criterion_index][alternative_index]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 59,
+ "id": "e416f0d9-8077-4215-852b-1e01308f9c5d",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(883, 3)"
+ ]
+ },
+ "execution_count": 59,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "(learning_data.performance_ranks[0][0], learning_data.performance_ranks[learning_data.criteria_count - 1][learning_data.alternatives_count - 1])"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "544df6c0-be0c-41b7-ac0e-11a31c5b7be8",
+ "metadata": {},
+ "source": [
+ "The assignment of each alternative, *i.e.* the index of its category:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 60,
+ "id": "26d14839-e77c-4c6b-9957-86d8c8f2d4b4",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[2, 2, 2, 0, 1, 1, 1, 2, 2, 0, '...']"
+ ]
+ },
+ "execution_count": 60,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "list(learning_data.assignments)[:10] + ['...'] # Indexed by [alternative_index]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 61,
+ "id": "16d76309-1578-45ed-bf65-1559545e1908",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(2, 2)"
+ ]
+ },
+ "execution_count": 61,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "(learning_data.assignments[0], learning_data.assignments[learning_data.alternatives_count - 1])"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "bf4de4df-f675-44e1-a908-a3554dd08083",
+ "metadata": {},
+ "source": [
+ "##### In-progress data"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "bbeccc8f-4b25-4029-a5fb-76d6257c4df7",
+ "metadata": {},
+ "source": [
+ "The second family of attributes is about the WeightsProfilesBreed algorithm itself.\n",
+ "\n",
+ "The `LearningData` contains several \"in progress\" models. Their number is constant:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 62,
+ "id": "e4ca254f-3629-4b3d-9811-745d054fc344",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "9"
+ ]
+ },
+ "execution_count": 62,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "learning_data.models_count"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "9807dc89-c81b-4e87-8671-07bce5a79edb",
+ "metadata": {},
+ "source": [
+ "Each model comes with a uniform random bits generator (URBG for short):"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 63,
+ "id": "cbd965fe-19b5-41b5-8428-17b59b5c9d3b",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "['',\n",
+ " '',\n",
+ " '',\n",
+ " '',\n",
+ " '',\n",
+ " '',\n",
+ " '',\n",
+ " '',\n",
+ " '']"
+ ]
+ },
+ "execution_count": 63,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "[str(urbg)[:43] + '>' for urbg in learning_data.urbgs] # Indexed by [model_index]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "b6e0e786-1a6f-4b1f-b173-c91398d0e3f4",
+ "metadata": {},
+ "source": [
+ "This lets heuristic strategies operate in parallel on models and still produce deterministic results. URBGs are callable to get the next pseudo-random integer:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 64,
+ "id": "79f1d0ca-68b0-4d2b-aabb-5191cac23c74",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[494155588,\n",
+ " 870190228,\n",
+ " 2450414687,\n",
+ " 641676058,\n",
+ " 661088198,\n",
+ " 363471047,\n",
+ " 1448606581,\n",
+ " 1348129397,\n",
+ " 2542538607]"
+ ]
+ },
+ "execution_count": 64,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "[r() for r in learning_data.urbgs]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "485e3ba4-f926-402a-b4ae-32363861a132",
+ "metadata": {},
+ "source": [
+ "WPB learning is iterative, and the `iteration_index` is stored in the learning data. It starts at zero and tells you the current iteration:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 65,
+ "id": "aa17bb83-d47f-42bc-a0d1-da6d201d4ad2",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "0"
+ ]
+ },
+ "execution_count": 65,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "learning_data.iteration_index"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "acaa99a2-e744-4063-8d2e-90aa24bc92b9",
+ "metadata": {},
+ "source": [
+ "The remaining attributes are modified at each iteration, and start uninitialized. For this presentation, we'll first run one iteration of WPB so that their values make sense."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 66,
+ "id": "72a72efe-2404-4f92-8ffc-cee6fbbeced1",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "learning_data = lc.LearnMrsortByWeightsProfilesBreed.LearningData(problem, learning_set, models_count=9, random_seed=43)\n",
+ "profiles_initialization_strategy = lc.InitializeProfilesForProbabilisticMaximalDiscriminationPowerPerCriterion(learning_data)\n",
+ "weights_optimization_strategy = lc.OptimizeWeightsUsingGlop(learning_data)\n",
+ "profiles_improvement_strategy = lc.ImproveProfilesWithAccuracyHeuristicOnCpu(learning_data)\n",
+ "breeding_strategy = lc.ReinitializeLeastAccurate(learning_data, profiles_initialization_strategy=profiles_initialization_strategy, count=4)\n",
+ "termination_strategy = lc.TerminateAfterIterations(learning_data, max_iterations_count=1)\n",
+ "\n",
+ "lc.LearnMrsortByWeightsProfilesBreed(\n",
+ " learning_data,\n",
+ " profiles_initialization_strategy,\n",
+ " weights_optimization_strategy,\n",
+ " profiles_improvement_strategy,\n",
+ " breeding_strategy,\n",
+ " termination_strategy,\n",
+ ").perform()\n",
+ "\n",
+ "assert(learning_data.iteration_index == 0)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "b3a8e44f-ced5-4e34-bdbe-0cd33a854348",
+ "metadata": {},
+ "source": [
+ "Its `model_indexes` contains indexes of models in increasing order of accuracy."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 67,
+ "id": "e9f9a2e9-dbc3-444a-a0f3-4b090dd46ca5",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[1, 5, 4, 8, 3, 6, 2, 0, 7]"
+ ]
+ },
+ "execution_count": 67,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "list(learning_data.model_indexes)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "b7f78a52-a965-4872-b6cf-a6fb45dd597d",
+ "metadata": {},
+ "source": [
+ "Its `accuracies` attribute holds the accuracy of each model. They are stored as the count of correctly-classified alternatives, between 0 and `alternatives_count` included:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 68,
+ "id": "504796aa-7aa1-424f-a458-e9e1df7c550f",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[728, 593, 725, 671, 637, 609, 676, 833, 640]"
+ ]
+ },
+ "execution_count": 68,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "list(learning_data.accuracies) # Indexed by [model_index]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "b5b5d24e-d8f0-45e0-adda-c4978a943872",
+ "metadata": {},
+ "source": [
+ "If you iterate the `accuracies` in the order of `model_indexes`, they are sorted:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 69,
+ "id": "dccb02f0-4eff-4452-b7f4-15d71b5db16a",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "True"
+ ]
+ },
+ "execution_count": 69,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "[learning_data.accuracies[index] for index in learning_data.model_indexes] == sorted(learning_data.accuracies)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "d80a063d-1456-4ae6-a57a-96a28bfda3a1",
+ "metadata": {},
+ "source": [
+ "@todo(Documentation, v1.1) Introduce profiles"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 70,
+ "id": "85b36a2f-39c0-45df-8648-083d0a85071c",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[[[124, 9, 0], [633, 9, 3]],\n",
+ " [[492, 8, 1], [965, 8, 4]],\n",
+ " [[268, 15, 0], [506, 54, 3]],\n",
+ " [[230, 8, 1], [272, 26, 4]],\n",
+ " [[201, 1, 1], [201, 2, 3]],\n",
+ " [[86, 64, 0], [86, 99, 0]],\n",
+ " [[223, 60, 2], [310, 80, 5]],\n",
+ " [[235, 20, 2], [595, 20, 3]],\n",
+ " [[261, 52, 0], [262, 52, 3]]]"
+ ]
+ },
+ "execution_count": 70,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "[[list(vv) for vv in v] for v in learning_data.profile_ranks] # Indexed by [model_index][boundary_index][criterion_index]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "fc0441fa-244f-4ed3-ad57-cf8cbea3ecf4",
+ "metadata": {},
+ "source": [
+ "@todo(Documentation, v1.1) Introduce weights"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 71,
+ "id": "382c323a-f9ac-437a-8a28-3472ca341efa",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[[1.0132789611816406e-06, 0.9999989867210388, 1.0132789611816406e-06],\n",
+ " [0.9999989867210388, 0.9999989867210388, 1.0132789611816406e-06],\n",
+ " [1.0, 0.0, 0.9999989867210388],\n",
+ " [0.5000004768371582, 0.4999994933605194, 0.4999994933605194],\n",
+ " [1.0132789611816406e-06, 0.9999989867210388, 0.0],\n",
+ " [0.9999989867210388, 0.0, 1.0132789611816406e-06],\n",
+ " [1.0, 0.0, 0.0],\n",
+ " [1.0, 0.9999989867210388, 1.0132789611816406e-06],\n",
+ " [0.9999989867210388, 0.0, 0.9999989867210388]]"
+ ]
+ },
+ "execution_count": 71,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "[list(v) for v in learning_data.weights] # Indexed by [model_index][criterion_index]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "6b4697a0-1ef4-4702-a261-fd909c29f08a",
+ "metadata": {},
+ "source": [
+ "#### `Observer`"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "99070e74-7640-4e05-a0e0-8066f304eb83",
+ "metadata": {},
+ "source": [
+ "With this better understanding of `LearningData`, let's write our own `Observer` strategy. It's arguably the simplest to start with, because it's not expected to *change* the `LearningData`.\n",
+ "\n",
+ "To start as simple as possible, let's reproduce the behavior of the `--...-verbose` flag on the command line, by creating an observer that just prints the best accuracy at each step.\n",
+ "\n",
+ "`Observer` strategies must define two methods to be called by the learning algorithm: `after_iteration`, to be called at the end of each iteration, after the breeding of models is done, and `before_return`, to be called just before the final model is returned."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 72,
+ "id": "11b11239-c0fb-4755-a61f-83e4a9a57494",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "class VerboseObserver(lc.LearnMrsortByWeightsProfilesBreed.Observer):\n",
+ " def __init__(self, learning_data):\n",
+ " super().__init__()\n",
+ " self.learning_data = learning_data\n",
+ "\n",
+ " def after_iteration(self):\n",
+ " print(f\"Best accuracy (after {self.learning_data.iteration_index + 1} iterations): {self.learning_data.get_best_accuracy()}\")\n",
+ "\n",
+ " def before_return(self):\n",
+ " print(f\"Final accuracy (after {self.learning_data.iteration_index + 1} iterations): {self.learning_data.get_best_accuracy()}\")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "f69b75d0-3a80-4c80-b7aa-c2ffe3b58973",
+ "metadata": {},
+ "source": [
+ "We can now pass it to a learning and perform that learning to observe its effects:"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 73,
+ "id": "8925d4ec-5716-428b-b895-9a34be3216ce",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Best accuracy (after 1 iterations): 938\n",
+ "Best accuracy (after 2 iterations): 992\n",
+ "Best accuracy (after 3 iterations): 997\n",
+ "Best accuracy (after 4 iterations): 997\n",
+ "Best accuracy (after 5 iterations): 997\n",
+ "Best accuracy (after 6 iterations): 997\n",
+ "Best accuracy (after 7 iterations): 997\n",
+ "Best accuracy (after 8 iterations): 999\n",
+ "Final accuracy (after 9 iterations): 1000\n"
+ ]
+ }
+ ],
+ "source": [
+ "profiles_initialization_strategy = lc.InitializeProfilesForProbabilisticMaximalDiscriminationPowerPerCriterion(learning_data)\n",
+ "weights_optimization_strategy = lc.OptimizeWeightsUsingGlop(learning_data)\n",
+ "profiles_improvement_strategy = lc.ImproveProfilesWithAccuracyHeuristicOnCpu(learning_data)\n",
+ "breeding_strategy = lc.ReinitializeLeastAccurate(learning_data, profiles_initialization_strategy=profiles_initialization_strategy, count=4)\n",
+ "termination_strategy = lc.TerminateAtAccuracy(learning_data, target_accuracy=len(learning_set.alternatives))\n",
+ "observer = VerboseObserver(learning_data)\n",
+ "\n",
+ "learned_model = lc.LearnMrsortByWeightsProfilesBreed(\n",
+ " learning_data,\n",
+ " profiles_initialization_strategy,\n",
+ " weights_optimization_strategy,\n",
+ " profiles_improvement_strategy,\n",
+ " breeding_strategy,\n",
+ " termination_strategy,\n",
+ " [observer],\n",
+ ").perform()"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "a558c178-0ba7-49fe-b7c0-95a89e13ff0b",
+ "metadata": {},
+ "source": [
+ "Now let's do something slightly more complicated: our goal for `IntermediatesObserver` is to keep track of the best model so far at different times during the learning. Specifically, we want to keep the models at iterations 1, 2, 4, 8, *etc.*"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 74,
+ "id": "b953eeba-6185-4432-b6ae-a262d88a635c",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "kind: ncs-classification-model\n",
+ "format_version: 1\n",
+ "accepted_values:\n",
+ " - kind: thresholds\n",
+ " thresholds: [7.7909708, 4.06594753]\n",
+ " - kind: thresholds\n",
+ " thresholds: [20, 20]\n",
+ " - kind: thresholds\n",
+ " thresholds: [D, C]\n",
+ "sufficient_coalitions:\n",
+ " - &coalitions\n",
+ " kind: weights\n",
+ " criterion_weights: [1, 0.999998987, 1.01327896e-06]\n",
+ " - *coalitions\n",
+ "kind: ncs-classification-model\n",
+ "format_version: 1\n",
+ "accepted_values:\n",
+ " - kind: thresholds\n",
+ " thresholds: [7.95116329, 3.89878368]\n",
+ " - kind: thresholds\n",
+ " thresholds: [0, 21]\n",
+ " - kind: thresholds\n",
+ " thresholds: [C, B]\n",
+ "sufficient_coalitions:\n",
+ " - &coalitions\n",
+ " kind: weights\n",
+ " criterion_weights: [1, 0, 1]\n",
+ " - *coalitions\n",
+ "kind: ncs-classification-model\n",
+ "format_version: 1\n",
+ "accepted_values:\n",
+ " - kind: thresholds\n",
+ " thresholds: [7.96338844, 3.82566905]\n",
+ " - kind: thresholds\n",
+ " thresholds: [73, 84]\n",
+ " - kind: thresholds\n",
+ " thresholds: [B, B]\n",
+ "sufficient_coalitions:\n",
+ " - &coalitions\n",
+ " kind: weights\n",
+ " criterion_weights: [1, 0, 1]\n",
+ " - *coalitions\n",
+ "kind: ncs-classification-model\n",
+ "format_version: 1\n",
+ "accepted_values:\n",
+ " - kind: thresholds\n",
+ " thresholds: [7.96338844, 3.74707603]\n",
+ " - kind: thresholds\n",
+ " thresholds: [94, 99]\n",
+ " - kind: thresholds\n",
+ " thresholds: [B, B]\n",
+ "sufficient_coalitions:\n",
+ " - &coalitions\n",
+ " kind: weights\n",
+ " criterion_weights: [1, 0, 1]\n",
+ " - *coalitions\n",
+ "kind: ncs-classification-model\n",
+ "format_version: 1\n",
+ "accepted_values:\n",
+ " - kind: thresholds\n",
+ " thresholds: [7.95116329, 3.74707603]\n",
+ " - kind: thresholds\n",
+ " thresholds: [94, 99]\n",
+ " - kind: thresholds\n",
+ " thresholds: [B, B]\n",
+ "sufficient_coalitions:\n",
+ " - &coalitions\n",
+ " kind: weights\n",
+ " criterion_weights: [1, 0, 1]\n",
+ " - *coalitions\n"
+ ]
+ }
+ ],
+ "source": [
+ "import math\n",
+ "\n",
+ "class IntermediatesObserver(lc.LearnMrsortByWeightsProfilesBreed.Observer):\n",
+ " def __init__(self, problem, learning_data):\n",
+ " super().__init__()\n",
+ " self.problem = problem\n",
+ " self.learning_data = learning_data\n",
+ " self.intermediate_models = []\n",
+ "\n",
+ " def after_iteration(self):\n",
+ " if math.log2(self.learning_data.iteration_index + 1).is_integer():\n",
+ " self.intermediate_models.append(self.learning_data.get_best_model())\n",
+ "\n",
+ " def before_return(self):\n",
+ " pass\n",
+ "\n",
+ "learning_data = lc.LearnMrsortByWeightsProfilesBreed.LearningData(problem, learning_set, models_count=9, random_seed=43) # Do *not* reuse the same `LearningData` for several learnings\n",
+ "profiles_initialization_strategy = lc.InitializeProfilesForProbabilisticMaximalDiscriminationPowerPerCriterion(learning_data)\n",
+ "weights_optimization_strategy = lc.OptimizeWeightsUsingGlop(learning_data)\n",
+ "profiles_improvement_strategy = lc.ImproveProfilesWithAccuracyHeuristicOnCpu(learning_data)\n",
+ "breeding_strategy = lc.ReinitializeLeastAccurate(learning_data, profiles_initialization_strategy=profiles_initialization_strategy, count=4)\n",
+ "termination_strategy = lc.TerminateAtAccuracy(learning_data, target_accuracy=len(learning_set.alternatives))\n",
+ "observer = IntermediatesObserver(problem, learning_data)\n",
+ "\n",
+ "final_model = lc.LearnMrsortByWeightsProfilesBreed(\n",
+ " learning_data,\n",
+ " profiles_initialization_strategy,\n",
+ " weights_optimization_strategy,\n",
+ " profiles_improvement_strategy,\n",
+ " breeding_strategy,\n",
+ " termination_strategy,\n",
+ " [observer],\n",
+ ").perform()\n",
+ "\n",
+ "for model in observer.intermediate_models:\n",
+ " model.dump(problem, sys.stdout)\n",
+ "final_model.dump(problem, sys.stdout)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "76bbaf16-0934-4cb2-b969-8a4f3f8cdf3e",
+ "metadata": {},
+ "source": [
+ "#### Other strategies"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "d3754888-d110-494f-9bb5-846cd749eb5a",
+ "metadata": {},
+ "source": [
+ "@todo(Documentation, v1.1) Write this section"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 75,
+ "id": "2182489b-a451-4e97-9045-0d65af27e0f1",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "class SillyWeightsStrategy(lc.LearnMrsortByWeightsProfilesBreed.WeightsOptimizationStrategy):\n",
+ " pass"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 76,
+ "id": "418ed6c6-2a36-438f-be7e-e47368523bf4",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "class SillyProfilesStrategy(lc.LearnMrsortByWeightsProfilesBreed.ProfilesImprovementStrategy):\n",
+ " pass"
+ ]
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.8.10"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/docs/_sources/changelog.rst.txt b/docs/_sources/changelog.rst.txt
index 7cf43e09..9de05d67 100644
--- a/docs/_sources/changelog.rst.txt
+++ b/docs/_sources/changelog.rst.txt
@@ -4,6 +4,23 @@
Changelog
=========
+Version 1.1.0a6 (2024-02-06)
+============================
+
+- **Breaking** Rename ``max_iteration_index`` to ``max_iterations_count`` in ``...TerminateAfterIterations.__init__``
+- Make the Python API guide Jupyter Notebook downloadable
+- Expose all attributes of ``WPB.LearningData``; start to document them in our Python API guide
+- Expose parameters of EvalMaxSAT in our API and command-line interface (see ``lincs learn classification-model --help``):
+
+ - ``--ucncs.max-sat-by-separation.solver`` (for consistency, always ``"eval-max-sat"`` for now)
+ - ``--ucncs.max-sat-by-separation.eval-max-sat.nb-minimize-threads``
+ - ``--ucncs.max-sat-by-separation.eval-max-sat.timeout-fast-minimize``
+ - ``--ucncs.max-sat-by-separation.eval-max-sat.coef-minimize-time``
+ - ``--ucncs.max-sat-by-coalitions.solver`` (for consistency, always ``"eval-max-sat"`` for now)
+ - ``--ucncs.max-sat-by-coalitions.eval-max-sat.nb-minimize-threads``
+ - ``--ucncs.max-sat-by-coalitions.eval-max-sat.timeout-fast-minimize``
+ - ``--ucncs.max-sat-by-coalitions.eval-max-sat.coef-minimize-time``
+
Version 1.1.0a5 (2024-02-01)
============================
diff --git a/docs/_sources/get-started.rst.txt b/docs/_sources/get-started.rst.txt
index 39c40b47..56f31a55 100644
--- a/docs/_sources/get-started.rst.txt
+++ b/docs/_sources/get-started.rst.txt
@@ -75,7 +75,7 @@ The generated ``problem.yml`` should look like:
.. code:: yaml
- # Reproduction command (with lincs version 1.1.0a5): lincs generate classification-problem 4 3 --random-seed 40
+ # Reproduction command (with lincs version 1.1.0a6): lincs generate classification-problem 4 3 --random-seed 40
kind: classification-problem
format_version: 1
criteria:
@@ -146,7 +146,7 @@ It should look like:
.. code:: yaml
- # Reproduction command (with lincs version 1.1.0a5): lincs generate classification-model problem.yml --random-seed 41 --model-type mrsort
+ # Reproduction command (with lincs version 1.1.0a6): lincs generate classification-model problem.yml --random-seed 41 --model-type mrsort
kind: ncs-classification-model
format_version: 1
accepted_values:
@@ -219,7 +219,7 @@ It should start with something like this, and contain 1000 alternatives:
.. code:: text
- # Reproduction command (with lincs version 1.1.0a5): lincs generate classified-alternatives problem.yml model.yml 1000 --random-seed 42 --misclassified-count 0
+ # Reproduction command (with lincs version 1.1.0a6): lincs generate classified-alternatives problem.yml model.yml 1000 --random-seed 42 --misclassified-count 0
name,"Criterion 1","Criterion 2","Criterion 3","Criterion 4",category
"Alternative 1",0.37454012,0.796543002,0.95071429,0.183434784,"Best category"
"Alternative 2",0.731993914,0.779690981,0.598658502,0.596850157,"Intermediate category 1"
@@ -255,7 +255,7 @@ so it is numerically different:
.. code:: yaml
- # Reproduction command (with lincs version 1.1.0a5): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 43 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver glop --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor cpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0
+ # Reproduction command (with lincs version 1.1.0a6): lincs learn classification-model problem.yml learning-set.csv --model-type mrsort --mrsort.strategy weights-profiles-breed --mrsort.weights-profiles-breed.models-count 9 --mrsort.weights-profiles-breed.accuracy-heuristic.random-seed 43 --mrsort.weights-profiles-breed.initialization-strategy maximize-discrimination-per-criterion --mrsort.weights-profiles-breed.weights-strategy linear-program --mrsort.weights-profiles-breed.linear-program.solver glop --mrsort.weights-profiles-breed.profiles-strategy accuracy-heuristic --mrsort.weights-profiles-breed.accuracy-heuristic.processor cpu --mrsort.weights-profiles-breed.breed-strategy reinitialize-least-accurate --mrsort.weights-profiles-breed.reinitialize-least-accurate.portion 0.5 --mrsort.weights-profiles-breed.target-accuracy 1.0
kind: ncs-classification-model
format_version: 1
accepted_values:
diff --git a/docs/_sources/python-api.md.txt b/docs/_sources/python-api.md.txt
index 279d8633..fa1d042e 100644
--- a/docs/_sources/python-api.md.txt
+++ b/docs/_sources/python-api.md.txt
@@ -5,6 +5,8 @@
This document builds up on {doc}`our "Get Started" guide ` and our {doc}`user guide `, and introduces *lincs*' Python API.
This API is more flexible, albeit more complex, than the command-line interface you've been using so far.
+If you're a Jupyter user, you can [download the notebook](python-api/python-api.ipynb) this document is based on.
+
## Do it again, in Python
First, lets do exactly the same thing as in our "Get started" guide, but using the Python API.
@@ -166,7 +168,7 @@ Dump it (in memory instead of on `sys.stdout` to print only the first few lines)
import io
f = io.StringIO()
learning_set.dump(problem, f)
-print("\n".join(f.getvalue().splitlines()[:6]))
+print("\n".join(f.getvalue().splitlines()[:6] + ['...']))
```
```text
@@ -176,6 +178,7 @@ name,"Criterion 1","Criterion 2","Criterion 3","Criterion 4",category
"Alternative 3",0.156018645,0.445832759,0.15599452,0.0999749228,"Worst category"
"Alternative 4",0.0580836125,0.4592489,0.866176128,0.333708614,"Best category"
"Alternative 5",0.601114988,0.14286682,0.708072603,0.650888503,"Intermediate category 1"
+...
```
@@ -817,4 +820,536 @@ Note however that learning objects (*e.g.* instances of `LearnMrsortByWeightsPro
### Create your own learning strategies
-@todo(Documentation, v1.1) Write this section. Include a demo of how to create a custom `Observer` that keeps the best model at iterations 1, 2, 4, *etc.*
+@todo(Documentation, v1.1) Introduce this section.
+
+
+```python
+problem = lc.Problem(
+ [
+ lc.Criterion("Criterion 1", lc.Criterion.RealValues(lc.Criterion.PreferenceDirection.decreasing, 0, 10)),
+ lc.Criterion("Criterion 2", lc.Criterion.IntegerValues(lc.Criterion.PreferenceDirection.increasing, 0, 100)),
+ lc.Criterion("Criterion 3", lc.Criterion.EnumeratedValues(["F", "E", "D", "C", "B", "A"])),
+ ],
+ [lc.Category("Bad"), lc.Category("Medium"), lc.Category("Good")],
+)
+model = lc.generate_mrsort_model(problem, random_seed=42)
+learning_set = lc.generate_alternatives(problem, model, alternatives_count=1000, random_seed=43)
+```
+
+#### `LearningData`
+
+First, let's get more familiar with the `LearningData`:
+
+
+```python
+learning_data = lc.LearnMrsortByWeightsProfilesBreed.LearningData(problem, learning_set, models_count=9, random_seed=43)
+```
+
+It contains two families of attributes.
+
+##### Input data
+
+The first one is about the problem and learning set. These attributes never change. First, the counts:
+
+
+```python
+(learning_data.criteria_count, learning_data.categories_count, learning_data.boundaries_count, learning_data.alternatives_count)
+```
+
+
+
+
+```text
+(3, 3, 2, 1000)
+```
+
+
+
+The learning set is pre-processed in the `LearningData` so that learning algorithms don't have to manipulate the different types of criterion values. In the `LearningData`, we keep only the ranks of the performances of each alternative in the learning set. The learning set is also destructured into a few arrays. Here are the attributes that describe this pre-processed learning set:
+
+The number of distinct values actually seen for each criterion (including the min and max values for numerical criteria):
+
+
+```python
+list(learning_data.values_counts) # Indexed by [criterion_index]
+```
+
+
+
+
+```text
+[1002, 101, 6]
+```
+
+
+
+
+```python
+(learning_data.values_counts[0], learning_data.values_counts[learning_data.criteria_count - 1])
+```
+
+
+
+
+```text
+(1002, 6)
+```
+
+
+
+We see that the learning data knows 1002 values for the real-valued criterion. This is usual as it's rare that two floating point values are exactly equal, so the 1000 alternatives have distinct values, and the min and max are two more values. The learning data contains 101 values for the integer-valued criterion, meaning that the alternatives in the learning set do actually cover the whole set of possible values. And similarly, 6 values for the enumerated criterion.
+
+For each criterion, the ranks of the performance of each alternative:
+
+
+```python
+[list(v)[:10] + ['...'] for v in learning_data.performance_ranks] # Indexed by [criterion_index][alternative_index]
+```
+
+
+
+
+```text
+[[883, 900, 753, 216, 365, 410, 302, 852, 738, 45, '...'],
+ [50, 13, 17, 86, 4, 2, 25, 81, 47, 87, '...'],
+ [3, 0, 1, 0, 3, 3, 2, 0, 0, 3, '...']]
+```
+
+
+
+
+```python
+(learning_data.performance_ranks[0][0], learning_data.performance_ranks[learning_data.criteria_count - 1][learning_data.alternatives_count - 1])
+```
+
+
+
+
+```text
+(883, 3)
+```
+
+
+
+The assignment of each alternative, *i.e.* the index of its category:
+
+
+```python
+list(learning_data.assignments)[:10] + ['...'] # Indexed by [alternative_index]
+```
+
+
+
+
+```text
+[2, 2, 2, 0, 1, 1, 1, 2, 2, 0, '...']
+```
+
+
+
+
+```python
+(learning_data.assignments[0], learning_data.assignments[learning_data.alternatives_count - 1])
+```
+
+
+
+
+```text
+(2, 2)
+```
+
+
+
+##### In-progress data
+
+The second family of attributes is about the WeightsProfilesBreed algorithm itself.
+
+The `LearningData` contains several "in progress" models. Their number is constant:
+
+
+```python
+learning_data.models_count
+```
+
+
+
+
+```text
+9
+```
+
+
+
+Each model comes with a uniform random bits generator (URBG for short):
+
+
+```python
+[str(urbg)[:43] + '>' for urbg in learning_data.urbgs] # Indexed by [model_index]
+```
+
+
+
+
+```text
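+['<liblincs.UniformRandomBitsGenerator object>',
+ '<liblincs.UniformRandomBitsGenerator object>',
+ '<liblincs.UniformRandomBitsGenerator object>',
+ '<liblincs.UniformRandomBitsGenerator object>',
+ '<liblincs.UniformRandomBitsGenerator object>',
+ '<liblincs.UniformRandomBitsGenerator object>',
+ '<liblincs.UniformRandomBitsGenerator object>',
+ '<liblincs.UniformRandomBitsGenerator object>',
+ '<liblincs.UniformRandomBitsGenerator object>']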
+```
+
+
+
+This lets heuristic strategies operate in parallel on models and still produce deterministic results. URBGs are callable to get the next pseudo-random integer:
+
+
+```python
+[r() for r in learning_data.urbgs]
+```
+
+
+
+
+```text
+[494155588,
+ 870190228,
+ 2450414687,
+ 641676058,
+ 661088198,
+ 363471047,
+ 1448606581,
+ 1348129397,
+ 2542538607]
+```
+
+
+
+WPB learning is iterative, and the `iteration_index` is stored in the learning data. It starts at zero and tells you the current iteration:
+
+
+```python
+learning_data.iteration_index
+```
+
+
+
+
+```text
+0
+```
+
+
+
+The remaining attributes are modified at each iteration, and start uninitialized. For this presentation, we'll first run one iteration of WPB so that their values make sense.
+
+
+```python
+learning_data = lc.LearnMrsortByWeightsProfilesBreed.LearningData(problem, learning_set, models_count=9, random_seed=43)
+profiles_initialization_strategy = lc.InitializeProfilesForProbabilisticMaximalDiscriminationPowerPerCriterion(learning_data)
+weights_optimization_strategy = lc.OptimizeWeightsUsingGlop(learning_data)
+profiles_improvement_strategy = lc.ImproveProfilesWithAccuracyHeuristicOnCpu(learning_data)
+breeding_strategy = lc.ReinitializeLeastAccurate(learning_data, profiles_initialization_strategy=profiles_initialization_strategy, count=4)
+termination_strategy = lc.TerminateAfterIterations(learning_data, max_iterations_count=1)
+
+lc.LearnMrsortByWeightsProfilesBreed(
+ learning_data,
+ profiles_initialization_strategy,
+ weights_optimization_strategy,
+ profiles_improvement_strategy,
+ breeding_strategy,
+ termination_strategy,
+).perform()
+
+assert(learning_data.iteration_index == 0)
+```
+
+Its `model_indexes` contains indexes of models in increasing order of accuracy.
+
+
+```python
+list(learning_data.model_indexes)
+```
+
+
+
+
+```text
+[1, 5, 4, 8, 3, 6, 2, 0, 7]
+```
+
+
+
+Its `accuracies` attribute holds the accuracy of each model. They are stored as the count of correctly-classified alternatives, between 0 and `alternatives_count` included:
+
+
+```python
+list(learning_data.accuracies) # Indexed by [model_index]
+```
+
+
+
+
+```text
+[728, 593, 725, 671, 637, 609, 676, 833, 640]
+```
+
+
+
+If you iterate the `accuracies` in the order of `model_indexes`, they are sorted:
+
+
+```python
+[learning_data.accuracies[index] for index in learning_data.model_indexes] == sorted(learning_data.accuracies)
+```
+
+
+
+
+```text
+True
+```
+
+
+
+@todo(Documentation, v1.1) Introduce profiles
+
+
+```python
+[[list(vv) for vv in v] for v in learning_data.profile_ranks] # Indexed by [model_index][boundary_index][criterion_index]
+```
+
+
+
+
+```text
+[[[124, 9, 0], [633, 9, 3]],
+ [[492, 8, 1], [965, 8, 4]],
+ [[268, 15, 0], [506, 54, 3]],
+ [[230, 8, 1], [272, 26, 4]],
+ [[201, 1, 1], [201, 2, 3]],
+ [[86, 64, 0], [86, 99, 0]],
+ [[223, 60, 2], [310, 80, 5]],
+ [[235, 20, 2], [595, 20, 3]],
+ [[261, 52, 0], [262, 52, 3]]]
+```
+
+
+
+@todo(Documentation, v1.1) Introduce weights
+
+
+```python
+[list(v) for v in learning_data.weights] # Indexed by [model_index][criterion_index]
+```
+
+
+
+
+```text
+[[1.0132789611816406e-06, 0.9999989867210388, 1.0132789611816406e-06],
+ [0.9999989867210388, 0.9999989867210388, 1.0132789611816406e-06],
+ [1.0, 0.0, 0.9999989867210388],
+ [0.5000004768371582, 0.4999994933605194, 0.4999994933605194],
+ [1.0132789611816406e-06, 0.9999989867210388, 0.0],
+ [0.9999989867210388, 0.0, 1.0132789611816406e-06],
+ [1.0, 0.0, 0.0],
+ [1.0, 0.9999989867210388, 1.0132789611816406e-06],
+ [0.9999989867210388, 0.0, 0.9999989867210388]]
+```
+
+
+
+#### `Observer`
+
+With this better understanding of `LearningData`, let's write our own `Observer` strategy. It's arguably the simplest to start with, because it's not expected to *change* the `LearningData`.
+
+To start as simple as possible, let's reproduce the behavior of the `--...-verbose` flag on the command line, by creating an observer that just prints the best accuracy at each step.
+
+`Observer` strategies must define two methods to be called by the learning algorithm: `after_iteration`, to be called at the end of each iteration, after the breeding of models is done, and `before_return`, to be called just before the final model is returned.
+
+
+```python
+class VerboseObserver(lc.LearnMrsortByWeightsProfilesBreed.Observer):
+ def __init__(self, learning_data):
+ super().__init__()
+ self.learning_data = learning_data
+
+ def after_iteration(self):
+ print(f"Best accuracy (after {self.learning_data.iteration_index + 1} iterations): {self.learning_data.get_best_accuracy()}")
+
+ def before_return(self):
+ print(f"Final accuracy (after {self.learning_data.iteration_index + 1} iterations): {self.learning_data.get_best_accuracy()}")
+```
+
+We can now pass it to a learning and perform that learning to observe its effects:
+
+
+```python
+profiles_initialization_strategy = lc.InitializeProfilesForProbabilisticMaximalDiscriminationPowerPerCriterion(learning_data)
+weights_optimization_strategy = lc.OptimizeWeightsUsingGlop(learning_data)
+profiles_improvement_strategy = lc.ImproveProfilesWithAccuracyHeuristicOnCpu(learning_data)
+breeding_strategy = lc.ReinitializeLeastAccurate(learning_data, profiles_initialization_strategy=profiles_initialization_strategy, count=4)
+termination_strategy = lc.TerminateAtAccuracy(learning_data, target_accuracy=len(learning_set.alternatives))
+observer = VerboseObserver(learning_data)
+
+learned_model = lc.LearnMrsortByWeightsProfilesBreed(
+ learning_data,
+ profiles_initialization_strategy,
+ weights_optimization_strategy,
+ profiles_improvement_strategy,
+ breeding_strategy,
+ termination_strategy,
+ [observer],
+).perform()
+```
+
+```text
+Best accuracy (after 1 iterations): 938
+Best accuracy (after 2 iterations): 992
+Best accuracy (after 3 iterations): 997
+Best accuracy (after 4 iterations): 997
+Best accuracy (after 5 iterations): 997
+Best accuracy (after 6 iterations): 997
+Best accuracy (after 7 iterations): 997
+Best accuracy (after 8 iterations): 999
+Final accuracy (after 9 iterations): 1000
+```
+
+
+Now let's do something slightly more complicated: our goal for `IntermediatesObserver` is to keep track of the best model so far at different times during the learning. Specifically, we want to keep the models at iterations 1, 2, 4, 8, *etc.*
+
+
+```python
+import math
+
+class IntermediatesObserver(lc.LearnMrsortByWeightsProfilesBreed.Observer):
+ def __init__(self, problem, learning_data):
+ super().__init__()
+ self.problem = problem
+ self.learning_data = learning_data
+ self.intermediate_models = []
+
+ def after_iteration(self):
+ if math.log2(self.learning_data.iteration_index + 1).is_integer():
+ self.intermediate_models.append(self.learning_data.get_best_model())
+
+ def before_return(self):
+ pass
+
+learning_data = lc.LearnMrsortByWeightsProfilesBreed.LearningData(problem, learning_set, models_count=9, random_seed=43) # Do *not* reuse the same `LearningData` for several learnings
+profiles_initialization_strategy = lc.InitializeProfilesForProbabilisticMaximalDiscriminationPowerPerCriterion(learning_data)
+weights_optimization_strategy = lc.OptimizeWeightsUsingGlop(learning_data)
+profiles_improvement_strategy = lc.ImproveProfilesWithAccuracyHeuristicOnCpu(learning_data)
+breeding_strategy = lc.ReinitializeLeastAccurate(learning_data, profiles_initialization_strategy=profiles_initialization_strategy, count=4)
+termination_strategy = lc.TerminateAtAccuracy(learning_data, target_accuracy=len(learning_set.alternatives))
+observer = IntermediatesObserver(problem, learning_data)
+
+final_model = lc.LearnMrsortByWeightsProfilesBreed(
+ learning_data,
+ profiles_initialization_strategy,
+ weights_optimization_strategy,
+ profiles_improvement_strategy,
+ breeding_strategy,
+ termination_strategy,
+ [observer],
+).perform()
+
+for model in observer.intermediate_models:
+ model.dump(problem, sys.stdout)
+final_model.dump(problem, sys.stdout)
+```
+
+```yaml
+kind: ncs-classification-model
+format_version: 1
+accepted_values:
+ - kind: thresholds
+ thresholds: [7.7909708, 4.06594753]
+ - kind: thresholds
+ thresholds: [20, 20]
+ - kind: thresholds
+ thresholds: [D, C]
+sufficient_coalitions:
+ - &coalitions
+ kind: weights
+ criterion_weights: [1, 0.999998987, 1.01327896e-06]
+ - *coalitions
+kind: ncs-classification-model
+format_version: 1
+accepted_values:
+ - kind: thresholds
+ thresholds: [7.95116329, 3.89878368]
+ - kind: thresholds
+ thresholds: [0, 21]
+ - kind: thresholds
+ thresholds: [C, B]
+sufficient_coalitions:
+ - &coalitions
+ kind: weights
+ criterion_weights: [1, 0, 1]
+ - *coalitions
+kind: ncs-classification-model
+format_version: 1
+accepted_values:
+ - kind: thresholds
+ thresholds: [7.96338844, 3.82566905]
+ - kind: thresholds
+ thresholds: [73, 84]
+ - kind: thresholds
+ thresholds: [B, B]
+sufficient_coalitions:
+ - &coalitions
+ kind: weights
+ criterion_weights: [1, 0, 1]
+ - *coalitions
+kind: ncs-classification-model
+format_version: 1
+accepted_values:
+ - kind: thresholds
+ thresholds: [7.96338844, 3.74707603]
+ - kind: thresholds
+ thresholds: [94, 99]
+ - kind: thresholds
+ thresholds: [B, B]
+sufficient_coalitions:
+ - &coalitions
+ kind: weights
+ criterion_weights: [1, 0, 1]
+ - *coalitions
+kind: ncs-classification-model
+format_version: 1
+accepted_values:
+ - kind: thresholds
+ thresholds: [7.95116329, 3.74707603]
+ - kind: thresholds
+ thresholds: [94, 99]
+ - kind: thresholds
+ thresholds: [B, B]
+sufficient_coalitions:
+ - &coalitions
+ kind: weights
+ criterion_weights: [1, 0, 1]
+ - *coalitions
+```
+
+
+#### Other strategies
+
+@todo(Documentation, v1.1) Write this section
+
+
+```python
+class SillyWeightsStrategy(lc.LearnMrsortByWeightsProfilesBreed.WeightsOptimizationStrategy):
+ pass
+```
+
+
+```python
+class SillyProfilesStrategy(lc.LearnMrsortByWeightsProfilesBreed.ProfilesImprovementStrategy):
+ pass
+```
diff --git a/docs/_sources/reference/lincs.rst.txt b/docs/_sources/reference/lincs.rst.txt
index 8647d341..e17ce245 100644
--- a/docs/_sources/reference/lincs.rst.txt
+++ b/docs/_sources/reference/lincs.rst.txt
@@ -26,6 +26,14 @@
Raised by learning algorithms when they can't reach their objective.
+ .. class:: UniformRandomBitsGenerator
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. method:: __call__(arg: UniformRandomBitsGenerator1) -> int
+
+ @todo(Documentation, v1.1) Add a docstring.
+
.. module:: lincs.classification
The ``lincs.classification`` module
@@ -654,7 +662,7 @@
@todo(Documentation, v1.1) Add a docstring.
- .. method:: __init__(problem: Problem, learning_set: Alternatives)
+ .. method:: __init__(problem: Problem, learning_set: Alternatives [, nb_minimize_threads: int=0 [, timeout_fast_minimize: int=60 [, coef_minimize_time: int=2]]])
@todo(Documentation, v1.1) Add a docstring.
@@ -666,7 +674,7 @@
@todo(Documentation, v1.1) Add a docstring.
- .. method:: __init__(problem: Problem, learning_set: Alternatives)
+ .. method:: __init__(problem: Problem, learning_set: Alternatives [, nb_minimize_threads: int=0 [, timeout_fast_minimize: int=60 [, coef_minimize_time: int=2]]])
@todo(Documentation, v1.1) Add a docstring.
@@ -714,7 +722,48 @@
@todo(Documentation, v1.1) Add a docstring.
- .. method:: get_best_accuracy() -> int
+ .. property:: criteria_count
+ :type: int
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: categories_count
+ :type: int
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: boundaries_count
+ :type: int
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: alternatives_count
+ :type: int
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: values_counts
+ :type: Iterable[int]
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: performance_ranks
+ :type: Iterable[Iterable[int]]
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: assignments
+ :type: Iterable[int]
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: models_count
+ :type: int
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: urbgs
+ :type: Iterable[UniformRandomBitsGenerator]
@todo(Documentation, v1.1) Add a docstring.
@@ -723,6 +772,34 @@
@todo(Documentation, v1.1) Add a docstring.
+ .. property:: model_indexes
+ :type: Iterable[int]
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: weights
+ :type: Iterable[Iterable[int]]
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: profile_ranks
+ :type: Iterable[Iterable[Iterable[int]]]
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. property:: accuracies
+ :type: Iterable[int]
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. method:: get_best_accuracy() -> int
+
+ @todo(Documentation, v1.1) Add a docstring.
+
+ .. method:: get_best_model() -> Model
+
+ @todo(Documentation, v1.1) Add a docstring.
+
.. class:: ProfilesInitializationStrategy
@todo(Documentation, v1.1) Add a docstring.
@@ -855,7 +932,7 @@
@todo(Documentation, v1.1) Add a docstring.
- .. method:: __init__(learning_data: LearningData, max_iteration_index: int)
+ .. method:: __init__(learning_data: LearningData, max_iterations_count: int)
@todo(Documentation, v1.1) Add a docstring.
diff --git a/docs/_sources/user-guide.rst.txt b/docs/_sources/user-guide.rst.txt
index ff43dbb6..c044281f 100644
--- a/docs/_sources/user-guide.rst.txt
+++ b/docs/_sources/user-guide.rst.txt
@@ -512,7 +512,7 @@ They produce a different kind of model, with the sufficient coalitions specified
.. code:: yaml
- # Reproduction command (with lincs version 1.1.0a5): lincs learn classification-model problem.yml learning-set.csv --model-type ucncs --ucncs.strategy sat-by-coalitions
+ # Reproduction command (with lincs version 1.1.0a6): lincs learn classification-model problem.yml learning-set.csv --model-type ucncs --ucncs.strategy sat-by-coalitions
kind: ncs-classification-model
format_version: 1
accepted_values:
diff --git a/docs/_static/documentation_options.js b/docs/_static/documentation_options.js
index 236873b3..e705bc86 100644
--- a/docs/_static/documentation_options.js
+++ b/docs/_static/documentation_options.js
@@ -1,6 +1,6 @@
var DOCUMENTATION_OPTIONS = {
URL_ROOT: document.getElementById("documentation_options").getAttribute('data-url_root'),
- VERSION: '1.1.0a5',
+ VERSION: '1.1.0a6',
LANGUAGE: 'en',
COLLAPSE_INDEX: false,
BUILDER: 'html',
diff --git a/docs/changelog.html b/docs/changelog.html
index 15847c16..029c458d 100644
--- a/docs/changelog.html
+++ b/docs/changelog.html
@@ -5,11 +5,11 @@
- Changelog — lincs 1.1.0a5 documentation
+ Changelog — lincs 1.1.0a6 documentation
-
+
@@ -34,6 +34,28 @@
Changelog
+
+Version 1.1.0a6 (2024-02-06)
+
+Breaking Rename max_iteration_index
to max_iterations_count
in ...TerminateAfterIterations.__init__
+Make the Python API guide Jupyter Notebook downloadable
+Expose all attributes of WPB.LearningData
; start to document them in our Python API guide
+Expose parameters of EvalMaxSAT in our API and command-line interface (see lincs learn classification-model --help
):
+
+
+--ucncs.max-sat-by-separation.solver
(for consistency, always "eval-max-sat"
for now)
+--ucncs.max-sat-by-separation.eval-max-sat.nb-minimize-threads
+--ucncs.max-sat-by-separation.eval-max-sat.timeout-fast-minimize
+--ucncs.max-sat-by-separation.eval-max-sat.coef-minimize-time
+--ucncs.max-sat-by-coalitions.solver
(for consistency, always "eval-max-sat"
for now)
+--ucncs.max-sat-by-coalitions.eval-max-sat.nb-minimize-threads
+--ucncs.max-sat-by-coalitions.eval-max-sat.timeout-fast-minimize
+--ucncs.max-sat-by-coalitions.eval-max-sat.coef-minimize-time
+
+
+
+
+
Version 1.1.0a5 (2024-02-01)
@@ -346,6 +368,7 @@ Navigation
Contributor guide
Roadmap
Changelog
+Version 1.1.0a6 (2024-02-06)
Version 1.1.0a5 (2024-02-01)
Versions 1.1.0a2 to 1.1.0a4 (2024-01-29)
Versions 1.1.0a0 (2024-01-10), 1.1.0a1 (2024-01-11)
diff --git a/docs/conceptual-overview.html b/docs/conceptual-overview.html
index 8f4f34cb..e7717edf 100644
--- a/docs/conceptual-overview.html
+++ b/docs/conceptual-overview.html
@@ -5,11 +5,11 @@
- Conceptual overview — lincs 1.1.0a5 documentation
+ Conceptual overview — lincs 1.1.0a6 documentation
-
+
diff --git a/docs/contributor-guide.html b/docs/contributor-guide.html
index 6a3586ce..597e0b64 100644
--- a/docs/contributor-guide.html
+++ b/docs/contributor-guide.html
@@ -5,11 +5,11 @@
- Contributor guide — lincs 1.1.0a5 documentation
+ Contributor guide — lincs 1.1.0a6 documentation
-
+
diff --git a/docs/genindex.html b/docs/genindex.html
index 9a91d44e..a5d61393 100644
--- a/docs/genindex.html
+++ b/docs/genindex.html
@@ -4,11 +4,11 @@
- Index — lincs 1.1.0a5 documentation
+ Index — lincs 1.1.0a6 documentation
-
+
@@ -292,8 +292,6 @@ Symbols
lincs-learn-classification-model command line option
-
-
+
+
--output-model
@@ -407,6 +407,62 @@ Symbols
+
+ --ucncs.max-sat-by-coalitions.eval-max-sat.coef-minimize-time
+
+
+
+ --ucncs.max-sat-by-coalitions.eval-max-sat.nb-minimize-threads
+
+
+
+ --ucncs.max-sat-by-coalitions.eval-max-sat.timeout-fast-minimize
+
+
+
+ --ucncs.max-sat-by-coalitions.solver
+
+
+
+ --ucncs.max-sat-by-separation.eval-max-sat.coef-minimize-time
+
+
+
+ --ucncs.max-sat-by-separation.eval-max-sat.nb-minimize-threads
+
+
+
+ --ucncs.max-sat-by-separation.eval-max-sat.timeout-fast-minimize
+
+
+
+ --ucncs.max-sat-by-separation.solver
+
+
@@ -508,6 +564,8 @@ Symbols
_
@@ -646,6 +710,8 @@ B
+ criteria_count (lincs.classification.LearnMrsortByWeightsProfilesBreed.LearningData property) , [1]
+
Criterion (class in lincs.classification) , [1]
Criterion.EnumeratedValues (class in lincs.classification) , [1]
@@ -752,11 +822,13 @@ G
generate_mrsort_model() (in module lincs.classification) , [1]
-
-
+
get_best_accuracy() (lincs.classification.LearnMrsortByWeightsProfilesBreed.LearningData method) , [1]
+
+ get_best_model() (lincs.classification.LearnMrsortByWeightsProfilesBreed.LearningData method) , [1]
get_value_rank() (lincs.classification.Criterion.EnumeratedValues method) , [1]
@@ -1081,6 +1153,22 @@ L
--mrsort.weights-profiles-breed.weights-strategy
--output-model
+
+ --ucncs.max-sat-by-coalitions.eval-max-sat.coef-minimize-time
+
+ --ucncs.max-sat-by-coalitions.eval-max-sat.nb-minimize-threads
+
+ --ucncs.max-sat-by-coalitions.eval-max-sat.timeout-fast-minimize
+
+ --ucncs.max-sat-by-coalitions.solver
+
+ --ucncs.max-sat-by-separation.eval-max-sat.coef-minimize-time
+
+ --ucncs.max-sat-by-separation.eval-max-sat.nb-minimize-threads
+
+ --ucncs.max-sat-by-separation.eval-max-sat.timeout-fast-minimize
+
+ --ucncs.max-sat-by-separation.solver
--ucncs.strategy
@@ -1159,6 +1247,10 @@ M
Model (class in lincs.classification) , [1]
Model.JSON_SCHEMA (in module lincs.classification) , [1]
+
+ model_indexes (lincs.classification.LearnMrsortByWeightsProfilesBreed.LearningData property) , [1]
+
+ models_count (lincs.classification.LearnMrsortByWeightsProfilesBreed.LearningData property) , [1]
module
@@ -1239,6 +1331,8 @@ P
Performance.Integer (class in lincs.classification) , [1]
Performance.Real (class in lincs.classification) , [1]
+
+ performance_ranks (lincs.classification.LearnMrsortByWeightsProfilesBreed.LearningData property) , [1]
PRE
@@ -1281,6 +1375,8 @@ P
Problem.JSON_SCHEMA (in module lincs.classification) , [1]
profile (lincs.classification.Alternative property) , [1]
+
+ profile_ranks (lincs.classification.LearnMrsortByWeightsProfilesBreed.LearningData property) , [1]
@@ -1386,10 +1482,14 @@ U
@@ -1405,8 +1505,6 @@ V
(lincs.classification.Performance.Real property) , [1]
-
-
+
@@ -1423,9 +1525,11 @@ V
W