Adjust pytorch distilbert notebook

bmyrcha · bmyrcha · commit 18fdb08be24c · 2023-10-24T17:17:16.000+02:00
Signed-off-by: bmyrcha <bartosz.myrcha@intel.com>
diff --git a/examples/notebook/pytorch/Quick_Started_Notebook_of_INC_for_Pytorch.ipynb b/examples/notebook/pytorch/Quick_Started_Notebook_of_INC_for_Pytorch.ipynb
@@ -45,14 +45,15 @@
    "outputs": [],
    "source": [
     "# install neural-compressor from source\n",
+    "import sys\n",
     "!git clone https://github.com/intel/neural-compressor.git\n",
     "%cd ./neural-compressor\n",
-    "!pip install -r requirements.txt\n",
-    "!python setup.py install\n",
+    "!{sys.executable} -m pip install -r requirements.txt\n",
+    "!{sys.executable} setup.py install\n",
     "%cd ..\n",
     "\n",
     "# or install stable basic version from pypi\n",
-    "!pip install neural-compressor"
+    "!{sys.executable} -m pip install neural-compressor\n"
    ]
   },
   {
@@ -62,7 +63,7 @@
    "outputs": [],
    "source": [
     "# install other packages used in this notebook.\n",
-    "!pip install torch>=1.9.0 transformers>=4.16.0 accelerate sympy numpy sentencepiece!=0.1.92 protobuf<=3.20.3 datasets>=1.1.3 scipy scikit-learn Keras-Preprocessing"
+    "!{sys.executable} -m pip install -r requirements.txt\n"
    ]
   },
   {
@@ -102,7 +103,7 @@
     "    AutoTokenizer,\n",
     "    EvalPrediction,\n",
     "    Trainer,\n",
-    ")"
+    ")\n"
    ]
   },
   {
@@ -114,7 +115,7 @@
     "task_name = 'mrpc'\n",
     "raw_datasets = load_dataset(\"glue\", task_name)\n",
     "label_list = raw_datasets[\"train\"].features[\"label\"].names\n",
-    "num_labels = len(label_list)"
+    "num_labels = len(label_list)\n"
    ]
   },
   {
@@ -150,7 +151,7 @@
     "    from_tf=False,\n",
     "    config=config,\n",
     "    use_auth_token=None,\n",
-    ")"
+    ")\n"
    ]
   },
   {
@@ -179,7 +180,7 @@
     "    result = tokenizer(*args, padding=padding, max_length=max_seq_length, truncation=True)\n",
     "    return result\n",
     "\n",
-    "raw_datasets = raw_datasets.map(preprocess_function, batched=True)"
+    "raw_datasets = raw_datasets.map(preprocess_function, batched=True)\n"
    ]
   },
   {
@@ -260,7 +261,7 @@
     "    assert False, \"No metric returned, Please check inference metric!\"\n",
     "\n",
     "def eval_func(model):\n",
-    "    return take_eval_steps(model, trainer)"
+    "    return take_eval_steps(model, trainer)\n"
    ]
   },
   {
@@ -284,7 +285,7 @@
     "from neural_compressor.config import PostTrainingQuantConfig, TuningCriterion\n",
     "tuning_criterion = TuningCriterion(max_trials=600)\n",
     "conf = PostTrainingQuantConfig(approach=\"static\", tuning_criterion=tuning_criterion)\n",
-    "q_model = fit(model, conf=conf, calib_dataloader=eval_dataloader, eval_func=eval_func)"
+    "q_model = fit(model, conf=conf, calib_dataloader=eval_dataloader, eval_func=eval_func)\n"
    ]
   },
   {
@@ -303,10 +304,10 @@
    "outputs": [],
    "source": [
     "# fp32 benchmark\n",
-    "!python benchmark.py --input_model ./pytorch_model.bin 2>&1|tee fp32_benchmark.log\n",
+    "!{sys.executable} benchmark.py --input_model ./pytorch_model.bin 2>&1|tee fp32_benchmark.log\n",
     "\n",
     "# int8 benchmark\n",
-    "!python benchmark.py --input_model ./saved_results/best_model.pt 2>&1|tee int8_benchmark.log\n"
+    "!{sys.executable} benchmark.py --input_model ./saved_results/best_model.pt 2>&1|tee int8_benchmark.log\n"
    ]
   }
  ],
diff --git a/examples/notebook/pytorch/requirements.txt b/examples/notebook/pytorch/requirements.txt
@@ -0,0 +1,11 @@
+torch>=1.9.0
+transformers>=4.16.0
+accelerate
+sympy
+numpy
+sentencepiece!=0.1.92
+protobuf<=3.20.3
+datasets>=1.1.3
+scipy
+scikit-learn
+Keras-Preprocessing

Original file line number	Diff line number	Diff line change
`@@ -45,14 +45,15 @@`
`45`	`45`	`"outputs": [],`
`46`	`46`	`"source": [`
`47`	`47`	`"# install neural-compressor from source\n",`
	`48`	`+ "import sys\n",`
`48`	`49`	`"!git clone https://github.com/intel/neural-compressor.git\n",`
`49`	`50`	`"%cd ./neural-compressor\n",`
`50`		`- "!pip install -r requirements.txt\n",`
`51`		`- "!python setup.py install\n",`
	`51`	`+ "!{sys.executable} -m pip install -r requirements.txt\n",`
	`52`	`+ "!{sys.executable} setup.py install\n",`
`52`	`53`	`"%cd ..\n",`
`53`	`54`	`"\n",`
`54`	`55`	`"# or install stable basic version from pypi\n",`
`55`		`- "!pip install neural-compressor"`
	`56`	`+ "!{sys.executable} -m pip install neural-compressor\n"`
`56`	`57`	`]`
`57`	`58`	`},`
`58`	`59`	`{`
`@@ -62,7 +63,7 @@`
`62`	`63`	`"outputs": [],`
`63`	`64`	`"source": [`
`64`	`65`	`"# install other packages used in this notebook.\n",`
`65`		`- "!pip install torch>=1.9.0 transformers>=4.16.0 accelerate sympy numpy sentencepiece!=0.1.92 protobuf<=3.20.3 datasets>=1.1.3 scipy scikit-learn Keras-Preprocessing"`
	`66`	`+ "!{sys.executable} -m pip install -r requirements.txt\n"`
`66`	`67`	`]`
`67`	`68`	`},`
`68`	`69`	`{`
`@@ -102,7 +103,7 @@`
`102`	`103`	`" AutoTokenizer,\n",`
`103`	`104`	`" EvalPrediction,\n",`
`104`	`105`	`" Trainer,\n",`
`105`		`- ")"`
	`106`	`+ ")\n"`
`106`	`107`	`]`
`107`	`108`	`},`
`108`	`109`	`{`
`@@ -114,7 +115,7 @@`
`114`	`115`	`"task_name = 'mrpc'\n",`
`115`	`116`	`"raw_datasets = load_dataset(\"glue\", task_name)\n",`
`116`	`117`	`"label_list = raw_datasets[\"train\"].features[\"label\"].names\n",`
`117`		`- "num_labels = len(label_list)"`
	`118`	`+ "num_labels = len(label_list)\n"`
`118`	`119`	`]`
`119`	`120`	`},`
`120`	`121`	`{`
`@@ -150,7 +151,7 @@`
`150`	`151`	`" from_tf=False,\n",`
`151`	`152`	`" config=config,\n",`
`152`	`153`	`" use_auth_token=None,\n",`
`153`		`- ")"`
	`154`	`+ ")\n"`
`154`	`155`	`]`
`155`	`156`	`},`
`156`	`157`	`{`
`@@ -179,7 +180,7 @@`
`179`	`180`	`" result = tokenizer(*args, padding=padding, max_length=max_seq_length, truncation=True)\n",`
`180`	`181`	`" return result\n",`
`181`	`182`	`"\n",`
`182`		`- "raw_datasets = raw_datasets.map(preprocess_function, batched=True)"`
	`183`	`+ "raw_datasets = raw_datasets.map(preprocess_function, batched=True)\n"`
`183`	`184`	`]`
`184`	`185`	`},`
`185`	`186`	`{`
`@@ -260,7 +261,7 @@`
`260`	`261`	`" assert False, \"No metric returned, Please check inference metric!\"\n",`
`261`	`262`	`"\n",`
`262`	`263`	`"def eval_func(model):\n",`
`263`		`- " return take_eval_steps(model, trainer)"`
	`264`	`+ " return take_eval_steps(model, trainer)\n"`
`264`	`265`	`]`
`265`	`266`	`},`
`266`	`267`	`{`
`@@ -284,7 +285,7 @@`
`284`	`285`	`"from neural_compressor.config import PostTrainingQuantConfig, TuningCriterion\n",`
`285`	`286`	`"tuning_criterion = TuningCriterion(max_trials=600)\n",`
`286`	`287`	`"conf = PostTrainingQuantConfig(approach=\"static\", tuning_criterion=tuning_criterion)\n",`
`287`		`- "q_model = fit(model, conf=conf, calib_dataloader=eval_dataloader, eval_func=eval_func)"`
	`288`	`+ "q_model = fit(model, conf=conf, calib_dataloader=eval_dataloader, eval_func=eval_func)\n"`
`288`	`289`	`]`
`289`	`290`	`},`
`290`	`291`	`{`
`@@ -303,10 +304,10 @@`
`303`	`304`	`"outputs": [],`
`304`	`305`	`"source": [`
`305`	`306`	`"# fp32 benchmark\n",`
`306`		`- "!python benchmark.py --input_model ./pytorch_model.bin 2>&1\|tee fp32_benchmark.log\n",`
	`307`	`+ "!{sys.executable} benchmark.py --input_model ./pytorch_model.bin 2>&1\|tee fp32_benchmark.log\n",`
`307`	`308`	`"\n",`
`308`	`309`	`"# int8 benchmark\n",`
`309`		`- "!python benchmark.py --input_model ./saved_results/best_model.pt 2>&1\|tee int8_benchmark.log\n"`
	`310`	`+ "!{sys.executable} benchmark.py --input_model ./saved_results/best_model.pt 2>&1\|tee int8_benchmark.log\n"`
`310`	`311`	`]`
`311`	`312`	`}`
`312`	`313`	`],`