Minor things before next release (#154)

* Update docs, readme * Intersphinx * Fix MABWiser link * Notes and warnings * Bump version to v5.2.0
N-Wouda · Jun 10, 2023 · d5372dd · d5372dd
1 parent 963080d
commit d5372dd
Show file tree

Hide file tree

Showing 9 changed files with 136 additions and 126 deletions.
diff --git a/README.md b/README.md
@@ -15,10 +15,15 @@ operator selection scheme is updated based on the evaluation outcome.
 
 `alns` depends only on `numpy` and `matplotlib`. It may be installed in the
 usual way as
-
 ```
 pip install alns
 ```
+Additionally, to enable more advanced operator selection schemes using 
+multi-armed bandit algorithms, `alns` may be installed with the optional 
+[MABWiser][12] dependency:
+```
+pip install alns[mabwiser]
+```
 
 The documentation is available [here][1].
 
@@ -122,3 +127,5 @@ Or, using the following BibTeX entry:
 [10]: https://alns.readthedocs.io/en/latest/setup/template.html
 
 [11]: https://alns.readthedocs.io/en/latest/setup/introduction_to_alns.html
+
+[12]: https://github.com/fidelity/mabwiser
diff --git a/alns/State.py b/alns/State.py
@@ -15,19 +15,13 @@ def objective(self) -> float:
  """
 
 
-class ContextualState(Protocol):
+class ContextualState(State, Protocol):
  """
  Protocol for a solution state that also provides context. Solutions should
- define an ``objective()`` function as well as a ``get_context()``
- function.
+ define ``objective()`` and ``get_context()`` methods.
  """
 
- def objective(self) -> float:
- """
- Computes the state's associated objective value.
- """
-
  def get_context(self) -> np.ndarray:
  """
- Computes a context vector for the current state
+ Computes a context vector for the current state.
  """
diff --git a/alns/select/AlphaUCB.py b/alns/select/AlphaUCB.py
@@ -63,7 +63,7 @@ class AlphaUCB(OperatorSelectionScheme):
  ----------
  .. [1] Hendel, G. 2022. Adaptive large neighborhood search for mixed
  integer programming. *Mathematical Programming Computation* 14:
- 185 – 221.
+ 185 - 221.
  """
 
  def __init__(

diff --git a/alns/select/MABSelector.py b/alns/select/MABSelector.py
@@ -7,9 +7,10 @@
 from alns.State import ContextualState
 from alns.select.OperatorSelectionScheme import OperatorSelectionScheme
 
-MABWISER_AVAILABLE = True
 try:
  from mabwiser.mab import MAB, LearningPolicy, NeighborhoodPolicy
+
+ MABWISER_AVAILABLE = True
 except ModuleNotFoundError:
  MABWISER_AVAILABLE = False
 
@@ -18,6 +19,11 @@ class MABSelector(OperatorSelectionScheme):
  """
  A selector that uses any multi-armed-bandit algorithm from MABWiser.
 
+ .. warning::
+
+ ALNS does not install MABWiser by default. You can install it as an
+ extra dependency via ``pip install alns[mabwiser]``.
+
  This selector is a wrapper around the many multi-armed bandit algorithms
  available in the `MABWiser <https://github.com/fidelity/mabwiser>`_
  library. Since ALNS operator selection can be framed as a
@@ -26,9 +32,12 @@ class MABSelector(OperatorSelectionScheme):
  multi-armed-bandit algorithms as operator selectors instead of
  having to reimplement them.
 
- Note that if the provided learning policy is a contextual bandit
- algorithm, your state class must provide a `get_context` function that
- returns a context vector for the current state.
+ .. note::
+
+ If the provided learning policy is a contextual bandit algorithm, your
+ state class must implement a ``get_context`` method that returns a
+ context vector for the current state. See the
+ :class:`~alns.State.ContextualState` protocol for details.
 
  Parameters
  ----------
@@ -54,12 +63,15 @@ class MABSelector(OperatorSelectionScheme):
  Optional boolean matrix that indicates coupling between destroy and
  repair operators. Entry (i, j) is True if destroy operator i can be
  used together with repair operator j, and False otherwise.
+ kwargs
+ Any additional arguments. These will be passed to the underlying MAB
+ object.
 
  References
  ----------
  .. [1] Emily Strong, Bernard Kleynhans, & Serdar Kadioglu (2021).
  MABWiser: Parallelizable Contextual Multi-armed Bandits.
- Int. J. Artif. Intell. Tools, 30(4), 2150021:1–2150021:19.
+ Int. J. Artif. Intell. Tools, 30(4), 2150021: 1 - 19.
  """
 
  def __init__(
@@ -74,7 +86,11 @@ def __init__(
  **kwargs,
  ):
  if not MABWISER_AVAILABLE:
- raise ImportError("MABSelector requires the MABWiser library. ")
+ msg = """
+ The MABSelector requires the MABWiser dependency to be installed.
+ You can install it using `pip install alns[mabwiser]`.
+ """
+ raise ModuleNotFoundError(msg)
 
  super().__init__(num_destroy, num_repair, op_coupling)
 
@@ -85,26 +101,19 @@ def __init__(
  # More than four is OK because we only use the first four.
  raise ValueError(f"Expected four scores, found {len(scores)}")
 
- # forward the seed argument if not null
+ self._scores = scores
+
  if seed is not None:
  kwargs["seed"] = seed
 
- # the set of valid operator pairs (arms) is equal to the cartesian
- # product of destroy and repair operators, except we leave out any
- # pairs disallowed by op_coupling
  arms = [
  f"{d_idx}_{r_idx}"
  for d_idx in range(num_destroy)
  for r_idx in range(num_repair)
  if self._op_coupling[d_idx, r_idx]
  ]
- self._mab = MAB(
- arms,
- learning_policy,
- neighborhood_policy,
- **kwargs,
- )
- self._scores = scores
+
+ self._mab = MAB(arms, learning_policy, neighborhood_policy, **kwargs)
 
  @property
  def scores(self) -> List[float]:
@@ -125,19 +134,17 @@ def __call__( # type: ignore[override]
  strategy
  """
  if self._mab._is_initial_fit:
- has_context = self._mab.is_contextual
- context = (
- np.atleast_2d(curr.get_context()) if has_context else None
- )
- prediction = self._mab.predict(contexts=context)
+ has_ctx = self._mab.is_contextual
+ ctx = np.atleast_2d(curr.get_context()) if has_ctx else None
+ prediction = self._mab.predict(contexts=ctx)
  return arm2ops(prediction)
  else:
  # This can happen when the MAB object has not yet been fit on any
  # observations. In that case we return any feasible operator index
  # pair as a first observation.
  allowed = np.argwhere(self._op_coupling)
  idx = rnd_state.randint(len(allowed))
- return (allowed[idx][0], allowed[idx][1])
+ return allowed[idx][0], allowed[idx][1]
 
  def update( # type: ignore[override]
  self,
@@ -150,20 +157,19 @@ def update( # type: ignore[override]
  Updates the underlying MAB algorithm given the reward of the chosen
  destroy and repair operator combination ``(d_idx, r_idx)``.
  """
- has_context = self._mab.is_contextual
- context = np.atleast_2d(cand.get_context()) if has_context else None
-
+ has_ctx = self._mab.is_contextual
+ ctx = np.atleast_2d(cand.get_context()) if has_ctx else None
  self._mab.partial_fit(
  [ops2arm(d_idx, r_idx)],
  [self._scores[outcome]],
- contexts=context,
+ contexts=ctx,
  )
 
 
-def ops2arm(destroy_idx: int, repair_idx: int) -> str:
+def ops2arm(d_idx: int, r_idx: int) -> str:
  """
- Converts a tuple of destroy and repair operator indices to an arm
- string that can be passed to self._mab.
+ Converts the given destroy and repair operator indices to an arm string
+ that can be passed to the MAB instance.
 
  Examples
  --------
@@ -172,12 +178,12 @@ def ops2arm(destroy_idx: int, repair_idx: int) -> str:
  >>> ops2arm(12, 3)
  "12_3"
  """
- return f"{destroy_idx}_{repair_idx}"
+ return f"{d_idx}_{r_idx}"
 
 
 def arm2ops(arm: str) -> Tuple[int, int]:
  """
- Converts an arm string returned from self._mab to a tuple of destroy
+ Converts an arm string returned by the MAB instance into a tuple of destroy
  and repair operator indices.
 
  Examples
@@ -187,5 +193,5 @@ def arm2ops(arm: str) -> Tuple[int, int]:
  >>> arm2ops("12_3")
  (12, 3)
  """
- [destroy, repair] = arm.split("_")
- return int(destroy), int(repair)
+ d_idx, r_idx = map(int, arm.split("_"))
+ return d_idx, r_idx
diff --git a/alns/select/tests/test_mab.py → alns/select/tests/test_mab_selector.py b/alns/select/tests/test_mab.py → alns/select/tests/test_mab_selector.py
@@ -2,7 +2,7 @@
 
 import numpy.random as rnd
 from mabwiser.mab import LearningPolicy, NeighborhoodPolicy
-from numpy.testing import assert_equal, assert_raises
+from numpy.testing import assert_, assert_equal, assert_raises
 from pytest import mark
 
 from alns.Outcome import Outcome
@@ -29,25 +29,16 @@ def test_arm_conversion(destroy_idx, repair_idx):
 
 
 def test_does_not_raise_on_valid_mab():
- MABSelector([0, 0, 0, 0], 2, 1, LearningPolicy.EpsilonGreedy(0.15))
- MABSelector(
- [0, 0, 0, 0],
- 2,
- 1,
- LearningPolicy.EpsilonGreedy(0.15),
- NeighborhoodPolicy.Radius(5),
- )
- MABSelector(
- [0, 0, 0, 0],
- 2,
- 1,
- LearningPolicy.EpsilonGreedy(0.15),
- NeighborhoodPolicy.Radius(5),
- 1234567,
- )
+ policy = LearningPolicy.EpsilonGreedy(0.15)
+ select = MABSelector([5, 0, 3, 0], 2, 1, policy)
+ assert_equal(select.scores, [5, 0, 3, 0])
+ assert_(len(select.mab.arms), 2)
+
+ MABSelector([0, 0, 0, 0], 2, 1, policy, NeighborhoodPolicy.Radius(5))
  MABSelector(
- [0, 0, 0, 0], 2, 1, LearningPolicy.EpsilonGreedy(0.15), seed=1234567
+ [1, 0, 0, 0], 2, 1, policy, NeighborhoodPolicy.Radius(5), 1234567
  )
+ MABSelector([2, 1, 0, 0], 2, 1, policy, seed=1234567)
 
 
 @mark.parametrize(

diff --git a/docs/source/api/select.rst b/docs/source/api/select.rst
@@ -17,7 +17,9 @@ All operator selection schemes inherit from :class:`~alns.select.OperatorSelecti
  :members:
 
 .. automodule:: alns.select.MABSelector
- :members:
+
+ .. autoclass:: MABSelector
+ :members:
 
 .. automodule:: alns.select.RandomSelect
  :members:

diff --git a/docs/source/conf.py b/docs/source/conf.py
@@ -64,6 +64,7 @@
  "sphinx": ("https://www.sphinx-doc.org/en/master/", None),
  "numpy": ("https://numpy.org/doc/stable/", None),
  "matplotlib": ("https://matplotlib.org/stable/", None),
+ "mabwiser": ("https://fidelity.github.io/mabwiser/", None),
 }
 intersphinx_disabled_domains = ["std"]