Commit f3b38b2

Enhance the strategy to avoid repeatedly initializing adaptor (#832)
Signed-off-by: Cheng, Zixuan <[email protected]>
Signed-off-by: yiliu30 <[email protected]>
Signed-off-by: Lv, Liang1 <[email protected]>
Signed-off-by: Cheng, Penghui <[email protected]>
1 parent fb8e503 commit f3b38b2

File tree: 8 files changed, +218 -79 lines

neural_compressor/adaptor/torch_utils/hawq_metric.py

Lines changed: 9 additions & 9 deletions

@@ -52,9 +52,9 @@ def remove(self):
 class HessianTrace:
     """HessianTrace Class.
 
-    Please refer to Yao, Zhewei, et al. "Pyhessian: Neural networks through the lens of the hessian."
+    Please refer to Yao, Zhewei, et al. "Pyhessian: Neural networks through the lens of the hessian."
     2020 IEEE international conference on big data (Big data). IEEE, 2020.
-    Dong, Zhen, et al. "Hawq-v2: Hessian aware trace-weighted quantization of neural networks."
+    Dong, Zhen, et al. "Hawq-v2: Hessian aware trace-weighted quantization of neural networks."
     Advances in neural information processing systems 33 (2020): 18518-18529.
     https://github.com/openvinotoolkit/nncf/blob/develop/nncf/torch/quantization/hessian_trace.py
     """

@@ -173,7 +173,7 @@ def act_grad_hook(model, grad_input, grad_output):
     def _get_enable_act_grad_hook(self, name):
         def enable_act_grad_hook(model, inputs, outputs):
             input = inputs[0]
-            if input.requires_grad is False:
+            if input.requires_grad is False: #
                 input.requires_grad = True
             self.layer_acts[name] = input
 

@@ -251,13 +251,13 @@ def _sample_rademacher(self, params):
             r.masked_fill_(r == 0, -1)
             samples.append(r)
         return samples
-
+
     def _sample_rademacher_like_params(self):
         def sample(parameter):
             r = torch.randint_like(parameter, high=2, device=self.device)
             return r.masked_fill_(r == 0, -1)
         return [sample(p) for p in self.params]
-
+
     def _sample_normal_like_params(self):
         return [torch.randn(p.size(), device=self.device) for p in self.params]
 

@@ -391,7 +391,7 @@ def _insert_hook(self, model, target_module_list):
         for layer, module in model.named_modules():
             for target_module in target_module_list:
                 # print("layer:",layer)
-                # print("target_model:",target_module)
+                # print("target_model:",target_module)
                 if layer == target_module:
                     logging.debug("Collect: %s" % (module))
                     # print("Collect: %s" % (module))

@@ -408,7 +408,7 @@ def _insert_hook_quantize(self, model, target_module_list):
                 # print("layer:",layer)
                 length = len("_model.")
                 new_key = layer[length:]
-                # print("target_model:",target_module)
+                # print("target_model:",target_module)
                 if new_key == target_module:
                     logging.debug("Collect: %s" % (module))
                     # print("Collect: %s" % (module))

@@ -521,7 +521,7 @@ def compare_weights(
     float_dict: Dict[str, Any], quantized_dict: Dict[str, Any]
 ) -> Dict[str, Dict[str, torch.Tensor]]:
     r"""Compare the weights of the float module with its corresponding quantized module.
-
+
     Returns a dict with key corresponding to module names and each entry being
     a dictionary with two keys 'float' and 'quantized', containing the float and
     quantized weights. This dict can be used to compare and compute the quantization

@@ -608,7 +608,7 @@ def hawq_top(fp32_model, q_model, dataloader, criterion, enable_act):
         op_qnt_tensor = weight_quant_loss[key]['quantized'].dequantize()
         diff_l2 = (torch.norm(op_float_tensor - op_qnt_tensor, p=2) ** 2)
         pertur_lst[key] = diff_l2
-
+
     if enable_act:
         act_to_traces = traces['activation']
         for trace_i, pertur_i, act_i in zip(op_to_traces.keys(), pertur_lst.keys(), act_to_traces.keys()):
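
The ±1 sampling in _sample_rademacher_like_params feeds HAWQ's Hessian-trace computation. As a rough, self-contained illustration only (not the repository's implementation; rademacher_like and hutchinson_trace are made-up names), Hutchinson's estimator approximates the trace of the loss Hessian as the average of v·Hv over random ±1 probe vectors v:

import torch

def rademacher_like(p):
    # Entries drawn uniformly from {-1, +1}, mirroring the sampling helper above.
    r = torch.randint_like(p, high=2)
    return r.masked_fill_(r == 0, -1)

def hutchinson_trace(loss, params, n_samples=8):
    # tr(H) ~= mean over probes v of v^T H v, with H the Hessian of `loss` w.r.t. `params`.
    grads = torch.autograd.grad(loss, params, create_graph=True)
    estimate = 0.0
    for _ in range(n_samples):
        vs = [rademacher_like(p) for p in params]
        # Hessian-vector product: differentiate <grads, v> w.r.t. the parameters again.
        hvs = torch.autograd.grad(grads, params, grad_outputs=vs, retain_graph=True)
        estimate = estimate + sum((v * hv).sum() for v, hv in zip(vs, hvs))
    return estimate / n_samples

# Example usage (toy model):
#   model = torch.nn.Linear(4, 1)
#   loss = model(torch.randn(8, 4)).pow(2).mean()
#   print(hutchinson_trace(loss, list(model.parameters())))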

neural_compressor/contrib/strategy/sigopt.py

Lines changed: 1 addition & 1 deletion

@@ -194,7 +194,7 @@ def traverse(self):
 
         This is SigOpt version of traverse -- with additional constraints setting to HPO.
         """
-        self._eval_baseline()
+        self._prepare_tuning()
 
         baseline_msg = '[Accuracy: {:.4f}'.format(self.baseline[0]) + \
             ''.join([', {}: {:.4f}'.format(x,y) for x,y in zip( \
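
For orientation, the sketch below shows the idempotent shape such a preparation step can take; _prepare_tuning() lives in the shared strategy base class and is not part of this diff, so the body here is an assumption, not the project's code. The intent named by the commit title is that adaptor setup and the baseline evaluation happen once, even when several strategies call the method in turn.

class _StrategySketch:
    # Illustrative only -- not neural_compressor's TuneStrategy.
    def __init__(self):
        self.adaptor = None      # expensive framework adaptor, built lazily
        self.baseline = None     # FP32 accuracy baseline, evaluated lazily

    def _prepare_tuning(self):
        # Safe to call at the top of every traverse(): work already done is skipped.
        if self.adaptor is None:
            self.adaptor = self._build_adaptor()
        if self.baseline is None:
            self.baseline = self._eval_baseline()

    def _build_adaptor(self):
        return object()          # placeholder for the real adaptor initialization

    def _eval_baseline(self):
        return 0.0               # placeholder for a real FP32 evaluation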

neural_compressor/contrib/strategy/tpe.py

Lines changed: 1 addition & 0 deletions

@@ -191,6 +191,7 @@ def _configure_hpopt_search_space_and_params(self, search_space):
     def traverse(self):
         """Tpe traverse logic."""
         logger.info("Start to run tpe strategy.")
+        self._prepare_tuning()
         # prepare log file
         trials_file = os.path.join(os.path.dirname(self.history_path), 'tpe_trials.csv')
         best_result_file = os.path.join(os.path.dirname(self.history_path), 'tpe_best_result.csv')

neural_compressor/strategy/auto.py

Lines changed: 3 additions & 6 deletions

@@ -79,13 +79,10 @@ def sequential_traverse(self):
                 eval_dataloader=self.eval_dataloader,
                 eval_metric=self.eval_metric,
                 resume=self._resume,
-                q_hooks=self.q_hooks)
+                q_hooks=self.q_hooks,
+                pre_strategy = pre_strategy
+                )
 
-            if pre_strategy:
-                #TODO add tuning history from the previous stage to current stage.
-                strategy.baseline = deepcopy(pre_strategy.baseline)
-                strategy.trials_count = pre_strategy.trials_count
-                strategy.objectives.baseline = deepcopy(pre_strategy.baseline)
             pre_strategy = strategy
             strategy.traverse()
             self.best_qmodel = strategy.best_qmodel
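
The removed block above used to copy the previous stage's state into the freshly built strategy by hand. A hedged sketch of where that logic plausibly moves, assuming the strategy constructor now accepts pre_strategy (the class name below is invented; the real TuneStrategy.__init__ may differ):

from copy import deepcopy

class _SketchStrategy:
    def __init__(self, pre_strategy=None):
        self.baseline = None
        self.trials_count = 0
        if pre_strategy is not None:
            # Inherit the previous stage's baseline and trial count instead of
            # re-evaluating them, so the adaptor/baseline work is not repeated.
            self.baseline = deepcopy(pre_strategy.baseline)
            self.trials_count = pre_strategy.trials_count

With the copying inside the constructor, sequential_traverse only has to pass pre_strategy along, as the hunk above shows.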

neural_compressor/strategy/auto_mixed_precision.py

Lines changed: 1 addition & 2 deletions

@@ -128,8 +128,7 @@ def next_tune_cfg(self):
 
     def traverse(self):
         """Traverse the tuning space according to auto-mixed precision strategy."""
-        # get fp32 model baseline
-        self._eval_baseline()
+        self._prepare_tuning()
 
         for op_tuning_cfg in self.next_tune_cfg():
             # add tune_cfg here as quantize use tune_cfg
