From 3ca502498d054fb9ca52eb4e2cae1eee5ffc7f34 Mon Sep 17 00:00:00 2001
From: Yuge Zhang <Yuge.Zhang@microsoft.com>
Date: Fri, 4 Jun 2021 15:06:08 +0900
Subject: [PATCH 1/5] Fix data race issue on Retiarii RL

---
 nni/retiarii/strategy/_rl_impl.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/nni/retiarii/strategy/_rl_impl.py b/nni/retiarii/strategy/_rl_impl.py
index 52bee6fadd..7e038aab69 100644
--- a/nni/retiarii/strategy/_rl_impl.py
+++ b/nni/retiarii/strategy/_rl_impl.py
@@ -1,6 +1,7 @@
 # This file might cause import error for those who didn't install RL-related dependencies
 
 import logging
+import threading
 from multiprocessing.pool import ThreadPool
 
 import gym
@@ -18,6 +19,7 @@
 
 
 _logger = logging.getLogger(__name__)
+_thread_lock = threading.Lock()
 
 
 class MultiThreadEnvWorker(EnvWorker):
@@ -100,7 +102,8 @@ def step(self, action):
                 if self.cur_step < self.num_steps else self.action_dim
         }
         if self.cur_step == self.num_steps:
-            model = get_targeted_model(self.base_model, self.mutators, self.sample)
+            with _thread_lock:
+                model = get_targeted_model(self.base_model, self.mutators, self.sample)
             _logger.info(f'New model created: {self.sample}')
             submit_models(model)
             wait_models(model)

From 5b564256a3eae455d2a79fe41288b08cf37da9a3 Mon Sep 17 00:00:00 2001
From: Yuge Zhang <Yuge.Zhang@microsoft.com>
Date: Fri, 4 Jun 2021 18:59:32 +0900
Subject: [PATCH 2/5] Update docstring in TPE and fix missing label in base
 mutator

---
 nni/retiarii/nn/pytorch/mutator.py    | 10 +++++-----
 nni/retiarii/strategy/tpe_strategy.py | 12 ++++++++++++
 2 files changed, 17 insertions(+), 5 deletions(-)

diff --git a/nni/retiarii/nn/pytorch/mutator.py b/nni/retiarii/nn/pytorch/mutator.py
index 6ef2ef19af..81c582669c 100644
--- a/nni/retiarii/nn/pytorch/mutator.py
+++ b/nni/retiarii/nn/pytorch/mutator.py
@@ -15,7 +15,7 @@
 
 class LayerChoiceMutator(Mutator):
     def __init__(self, nodes: List[Node]):
-        super().__init__()
+        super().__init__(label=nodes[0].operation.parameters['label'])
         self.nodes = nodes
 
     def mutate(self, model):
@@ -40,7 +40,7 @@ def mutate(self, model):
 
 class InputChoiceMutator(Mutator):
     def __init__(self, nodes: List[Node]):
-        super().__init__()
+        super().__init__(label=nodes[0].operation.parameters['label'])
         self.nodes = nodes
 
     def mutate(self, model):
@@ -56,7 +56,7 @@ def mutate(self, model):
 
 class ValueChoiceMutator(Mutator):
     def __init__(self, nodes: List[Node], candidates: List[Any]):
-        super().__init__()
+        super().__init__(label=nodes[0].operation.parameters['label'])
         self.nodes = nodes
         self.candidates = candidates
 
@@ -69,7 +69,7 @@ def mutate(self, model):
 
 class ParameterChoiceMutator(Mutator):
     def __init__(self, nodes: List[Tuple[Node, str]], candidates: List[Any]):
-        super().__init__()
+        super().__init__(label=nodes[0].operation.parameters['label'])
         self.nodes = nodes
         self.candidates = candidates
 
@@ -84,7 +84,7 @@ def mutate(self, model):
 class RepeatMutator(Mutator):
     def __init__(self, nodes: List[Node]):
         # nodes is a subgraph consisting of repeated blocks.
-        super().__init__()
+        super().__init__(label=nodes[0].operation.parameters['label'])
         self.nodes = nodes
 
     def _retrieve_chain_from_graph(self, graph: Graph) -> List[Node]:
diff --git a/nni/retiarii/strategy/tpe_strategy.py b/nni/retiarii/strategy/tpe_strategy.py
index 7d897cbfb3..811ec4c4ef 100644
--- a/nni/retiarii/strategy/tpe_strategy.py
+++ b/nni/retiarii/strategy/tpe_strategy.py
@@ -40,6 +40,18 @@ def choice(self, candidates, mutator, model, index):
 
 
 class TPEStrategy(BaseStrategy):
+    """
+    The Tree-structured Parzen Estimator (TPE) [1]_ is a sequential model-based optimization (SMBO) approach.
+    SMBO methods sequentially construct models to approximate the performance of hyperparameters based on historical measurements,
+    and then subsequently choose new hyperparameters to test based on this model.
+
+    References
+    ----------
+
+    .. [1] Bergstra et al., "Algorithms for Hyper-Parameter Optimization".
+        https://papers.nips.cc/paper/4443-algorithms-for-hyper-parameter-optimization.pdf
+    """
+
     def __init__(self):
         self.tpe_sampler = TPESampler()
         self.model_id = 0

From 3c2e3d64a2b94dbca5be152ca76954322b530cda Mon Sep 17 00:00:00 2001
From: Yuge Zhang <Yuge.Zhang@microsoft.com>
Date: Mon, 7 Jun 2021 11:42:35 +0900
Subject: [PATCH 3/5] Fix doc lint issue

---
 nni/retiarii/nn/pytorch/component.py  | 6 +++---
 nni/retiarii/strategy/tpe_strategy.py | 4 ++--
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/nni/retiarii/nn/pytorch/component.py b/nni/retiarii/nn/pytorch/component.py
index 4ae5dc03bb..20c6e30de5 100644
--- a/nni/retiarii/nn/pytorch/component.py
+++ b/nni/retiarii/nn/pytorch/component.py
@@ -72,7 +72,7 @@ def _replicate_and_instantiate(blocks, repeat):
 
 class Cell(nn.Module):
     """
-    Cell structure [1]_ [2]_ that is popularly used in NAS literature.
+    Cell structure [zophnas]_ [zophnasnet]_ that is popularly used in NAS literature.
 
     A cell consists of multiple "nodes". Each node is a sum of multiple operators. Each operator is chosen from
     ``op_candidates``, and takes one input from previous nodes and predecessors. Predecessor means the input of cell.
@@ -95,8 +95,8 @@ class Cell(nn.Module):
 
     References
     ----------
-    .. [1] Barret Zoph, Quoc V. Le, "Neural Architecture Search with Reinforcement Learning". https://arxiv.org/abs/1611.01578
-    .. [2] Barret Zoph, Vijay Vasudevan, Jonathon Shlens, Quoc V. Le,
+    .. [zophnas] Barret Zoph, Quoc V. Le, "Neural Architecture Search with Reinforcement Learning". https://arxiv.org/abs/1611.01578
+    .. [zophnasnet] Barret Zoph, Vijay Vasudevan, Jonathon Shlens, Quoc V. Le,
         "Learning Transferable Architectures for Scalable Image Recognition". https://arxiv.org/abs/1707.07012
     """
 
diff --git a/nni/retiarii/strategy/tpe_strategy.py b/nni/retiarii/strategy/tpe_strategy.py
index 811ec4c4ef..7f55ad302e 100644
--- a/nni/retiarii/strategy/tpe_strategy.py
+++ b/nni/retiarii/strategy/tpe_strategy.py
@@ -41,14 +41,14 @@ def choice(self, candidates, mutator, model, index):
 
 class TPEStrategy(BaseStrategy):
     """
-    The Tree-structured Parzen Estimator (TPE) [1]_ is a sequential model-based optimization (SMBO) approach.
+    The Tree-structured Parzen Estimator (TPE) [bergstrahpo]_ is a sequential model-based optimization (SMBO) approach.
     SMBO methods sequentially construct models to approximate the performance of hyperparameters based on historical measurements,
     and then subsequently choose new hyperparameters to test based on this model.
 
     References
     ----------
 
-    .. [1] Bergstra et al., "Algorithms for Hyper-Parameter Optimization".
+    .. [bergstrahpo] Bergstra et al., "Algorithms for Hyper-Parameter Optimization".
         https://papers.nips.cc/paper/4443-algorithms-for-hyper-parameter-optimization.pdf
     """
 

From e3f4a016cee2fee200b47251e80a3f4e6f0754a7 Mon Sep 17 00:00:00 2001
From: Yuge Zhang <Yuge.Zhang@microsoft.com>
Date: Mon, 7 Jun 2021 12:50:03 +0900
Subject: [PATCH 4/5] Fix label lookup in ParameterChoiceMutator (fixes parameter choice test)

---
 nni/retiarii/nn/pytorch/mutator.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/nni/retiarii/nn/pytorch/mutator.py b/nni/retiarii/nn/pytorch/mutator.py
index 81c582669c..5724ae46f1 100644
--- a/nni/retiarii/nn/pytorch/mutator.py
+++ b/nni/retiarii/nn/pytorch/mutator.py
@@ -69,7 +69,8 @@ def mutate(self, model):
 
 class ParameterChoiceMutator(Mutator):
     def __init__(self, nodes: List[Tuple[Node, str]], candidates: List[Any]):
-        super().__init__(label=nodes[0].operation.parameters['label'])
+        node, argname = nodes[0]
+        super().__init__(label=node.operation.parameters[argname].label)
         self.nodes = nodes
         self.candidates = candidates
 

From 4b9e9d78742adfea72a0eea943827e2a7b28289e Mon Sep 17 00:00:00 2001
From: Yuge Zhang <Yuge.Zhang@microsoft.com>
Date: Mon, 7 Jun 2021 15:54:08 +0900
Subject: [PATCH 5/5] Fix resource polling in brute-force strategies: if -> while

---
 nni/retiarii/strategy/bruteforce.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/nni/retiarii/strategy/bruteforce.py b/nni/retiarii/strategy/bruteforce.py
index 379b159ba6..2e007cc0ab 100644
--- a/nni/retiarii/strategy/bruteforce.py
+++ b/nni/retiarii/strategy/bruteforce.py
@@ -62,7 +62,7 @@ def run(self, base_model, applied_mutators):
         search_space = dry_run_for_search_space(base_model, applied_mutators)
         for sample in grid_generator(search_space, shuffle=self.shuffle):
             _logger.debug('New model created. Waiting for resource. %s', str(sample))
-            if query_available_resources() <= 0:
+            while query_available_resources() <= 0:
                 time.sleep(self._polling_interval)
             submit_models(get_targeted_model(base_model, applied_mutators, sample))
 
@@ -113,6 +113,6 @@ def run(self, base_model, applied_mutators):
             search_space = dry_run_for_search_space(base_model, applied_mutators)
             for sample in random_generator(search_space, dedup=self.dedup):
                 _logger.debug('New model created. Waiting for resource. %s', str(sample))
-                if query_available_resources() <= 0:
+                while query_available_resources() <= 0:
                     time.sleep(self._polling_interval)
                 submit_models(get_targeted_model(base_model, applied_mutators, sample))