fix domain detection for large model (#565)

yuwenzho · web-flow · commit 70a566239d44 · 2023-02-28T13:55:41.000+08:00
Signed-off-by: yuwenzho <yuwen.zhou@intel.com>
diff --git a/neural_compressor/adaptor/onnxrt.py b/neural_compressor/adaptor/onnxrt.py
@@ -636,7 +636,12 @@ def _detect_domain(self, model):
         # 2. according to input
         # typically, NLP models have multiple inputs, 
         # and the dimension of each input is usually 2 (batch_size, max_seq_len)
-        sess = ort.InferenceSession(model.model.SerializeToString())
+        if not model.is_large_model:
+            sess = ort.InferenceSession(model.model.SerializeToString())
+        elif model.model_path is not None: # pragma: no cover
+            sess = ort.InferenceSession(model.model_path)
+        else: # pragma: no cover
+            assert False, "Please use model path instead of onnx model object to quantize."
         input_shape_lens = [len(input.shape) for input in  sess.get_inputs()]
         if len(input_shape_lens) > 1 and all(shape_len == 2 for shape_len in input_shape_lens):
             is_nlp = True