Skip to content
Merged
Show file tree
Hide file tree
Changes from 16 commits
Commits
Show all changes
39 commits
Select commit Hold shift + click to select a range
3eaaa57
add VLM examples
WeiweiZhang1 Sep 26, 2024
8cc273b
bugfix, add utils
WeiweiZhang1 Sep 26, 2024
8597597
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Sep 26, 2024
53b4b32
fix docstring issues
WeiweiZhang1 Sep 26, 2024
f915e49
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Sep 26, 2024
c5127a3
bugfix
WeiweiZhang1 Sep 26, 2024
e3a28e6
resolve bugs
WeiweiZhang1 Sep 26, 2024
6b4c2ff
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Sep 26, 2024
ecd5410
refine examples
WeiweiZhang1 Sep 26, 2024
9212575
fix scan issue
WeiweiZhang1 Sep 26, 2024
533afd0
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Sep 26, 2024
21e1dbb
refine shell
WeiweiZhang1 Sep 26, 2024
64d1b3e
refine scripts & requirements
WeiweiZhang1 Sep 29, 2024
dc368b2
typofix
WeiweiZhang1 Sep 29, 2024
22082df
refine docs
WeiweiZhang1 Sep 30, 2024
4045b36
Merge branch 'master' into add_vlm_examples
WeiweiZhang1 Oct 8, 2024
a3b381d
set attn_implementation for Phi3-vision
WeiweiZhang1 Oct 8, 2024
b827c11
refine phi3 example
WeiweiZhang1 Oct 8, 2024
995c914
Merge branch 'add_vlm_examples' of https://github.com/intel/neural-co…
WeiweiZhang1 Oct 8, 2024
8767ffc
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Oct 8, 2024
afbfcfa
fix code coverage
WeiweiZhang1 Oct 8, 2024
5aa584c
fix code coverage
WeiweiZhang1 Oct 8, 2024
6b8cc73
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Oct 8, 2024
9555321
update config
XuehaoSun Oct 9, 2024
5dcb9bd
refine shells, docs and example. enable qwen2-vl quantization
WeiweiZhang1 Oct 15, 2024
ce514db
Merge branch 'master' into add_vlm_examples
WeiweiZhang1 Oct 15, 2024
335f29e
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Oct 15, 2024
b3bea7f
fix ci
WeiweiZhang1 Oct 15, 2024
33d49e1
fix EOF error
XuehaoSun Oct 17, 2024
414811a
update qwen dir
XuehaoSun Oct 17, 2024
3630267
refine shell, add llama3.2 inference to doc
WeiweiZhang1 Oct 17, 2024
e75719e
refine shell, add llama3.2 inference to doc
WeiweiZhang1 Oct 17, 2024
4190934
bugfix
WeiweiZhang1 Oct 17, 2024
dd9a4be
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Oct 17, 2024
d4cd3bd
bugfix
WeiweiZhang1 Oct 18, 2024
d9193cf
bugfix
WeiweiZhang1 Oct 18, 2024
d4b9f52
refine eval shell
WeiweiZhang1 Oct 18, 2024
dade1f6
fix eval device issue
WeiweiZhang1 Oct 18, 2024
749812c
refine eval dtype
WeiweiZhang1 Oct 18, 2024
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
359 changes: 190 additions & 169 deletions examples/.config/model_params_pytorch_3x.json
Original file line number Diff line number Diff line change
@@ -1,172 +1,193 @@
{
"pytorch": {
"opt_125m_woq_gptq_int4":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"opt_125m_woq_gptq_int4_dq_bnb":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"opt_125m_woq_gptq_int4_dq_ggml":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"llama2_7b_gptq_int4":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"llama2_7b_gptq_int4_dq_bnb":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"llama2_7b_gptq_int4_dq_ggml":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_rtn_int4":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_rtn_int4_dq_bnb":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_rtn_int4_dq_ggml":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_gptq_int4":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_gptq_int4_dq_bnb":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_gptq_int4_dq_ggml":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_ipex":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/static_quant/ipex",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"gpt_j_ipex_sq":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/smooth_quant",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"llama2_7b_ipex":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/static_quant/ipex",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"llama2_7b_ipex_sq":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/smooth_quant",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"opt_125m_ipex":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/static_quant/ipex",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"opt_125m_ipex_sq":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/smooth_quant",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"dlrm_ipex": {
"model_src_dir": "recommendation/dlrm/static_quant/ipex",
"dataset_location": "/mnt/local_disk3/dataset/dlrm/dlrm/input",
"input_model": "/mnt/local_disk3/dataset/dlrm/dlrm/dlrm_weight/tb00_40M.pt",
"main_script": "dlrm_s_pytorch.py",
"batch_size": 16384
},
"resnet18_pt2e_static":{
"model_src_dir": "cv/static_quant",
"dataset_location": "/tf_dataset/pytorch/ImageNet/raw",
"input_model": "",
"main_script": "main.py",
"batch_size": 1
},
"resnet18_fp8_static":{
"model_src_dir": "cv/fp8_quant",
"dataset_location": "/tf_dataset/pytorch/ImageNet/raw",
"input_model": "",
"main_script": "main.py",
"batch_size": 1
},
"opt_125m_pt2e_static":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/static_quant/pt2e",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"sdxl_ipex_sq":{
"model_src_dir": "diffusion_model/diffusers/stable_diffusion/smooth_quant",
"dataset_location": "",
"input_model": "",
"main_script": "main.py",
"batch_size": 1
},
"resnet18_mixed_precision": {
"model_src_dir": "cv/mixed_precision",
"dataset_location": "/tf_dataset/pytorch/ImageNet/raw",
"input_model": "resnet18",
"main_script": "main.py",
"batch_size": 20
}
"pytorch": {
"llava_woq_autoround_int4":{
"model_src_dir": "multimodal-modeling/quantization/auto_round/Llava",
"dataset_location": "/tf_dataset2/datasets/coco2017/coco/train2017",
"input_model": "liuhaotian/llava-v1.5-7b",
"main_script": "main.py",
"batch_size": 1
},
"qwenvl_woq_autoround_int4":{
"model_src_dir": "multimodal-modeling/quantization/auto_round/Qwen-VL",
"dataset_location": "/tf_dataset2/datasets/coco2017/coco/train2017",
"input_model": "Qwen/Qwen-VL",
"main_script": "main.py",
"batch_size": 8
},
"Phi3Vision_woq_autoround_int4":{
"model_src_dir": "multimodal-modeling/quantization/auto_round/Phi3-3-vision",
"dataset_location": "/tf_dataset2/datasets/coco2017/coco/train2017",
"input_model": "microsoft/Phi-3-vision-128k-instruct",
"main_script": "main.py",
"batch_size": 1
},
"opt_125m_woq_gptq_int4":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"opt_125m_woq_gptq_int4_dq_bnb":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"opt_125m_woq_gptq_int4_dq_ggml":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"llama2_7b_gptq_int4":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"llama2_7b_gptq_int4_dq_bnb":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"llama2_7b_gptq_int4_dq_ggml":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_rtn_int4":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_rtn_int4_dq_bnb":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_rtn_int4_dq_ggml":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_gptq_int4":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_gptq_int4_dq_bnb":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_woq_gptq_int4_dq_ggml":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/weight_only",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"gpt_j_ipex":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/static_quant/ipex",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"gpt_j_ipex_sq":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/smooth_quant",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"llama2_7b_ipex":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/static_quant/ipex",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"llama2_7b_ipex_sq":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/smooth_quant",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"opt_125m_ipex":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/static_quant/ipex",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"opt_125m_ipex_sq":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/smooth_quant",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 8
},
"dlrm_ipex": {
"model_src_dir": "recommendation/dlrm/static_quant/ipex",
"dataset_location": "/mnt/local_disk3/dataset/dlrm/dlrm/input",
"input_model": "/mnt/local_disk3/dataset/dlrm/dlrm/dlrm_weight/tb00_40M.pt",
"main_script": "dlrm_s_pytorch.py",
"batch_size": 16384
},
"resnet18_pt2e_static":{
"model_src_dir": "cv/static_quant",
"dataset_location": "/tf_dataset/pytorch/ImageNet/raw",
"input_model": "",
"main_script": "main.py",
"batch_size": 1
},
"resnet18_fp8_static":{
"model_src_dir": "cv/fp8_quant",
"dataset_location": "/tf_dataset/pytorch/ImageNet/raw",
"input_model": "",
"main_script": "main.py",
"batch_size": 1
},
"opt_125m_pt2e_static":{
"model_src_dir": "nlp/huggingface_models/language-modeling/quantization/static_quant/pt2e",
"dataset_location": "",
"input_model": "",
"main_script": "run_clm_no_trainer.py",
"batch_size": 1
},
"sdxl_ipex_sq":{
"model_src_dir": "diffusion_model/diffusers/stable_diffusion/smooth_quant",
"dataset_location": "",
"input_model": "",
"main_script": "main.py",
"batch_size": 1
},
"resnet18_mixed_precision": {
"model_src_dir": "cv/mixed_precision",
"dataset_location": "/tf_dataset/pytorch/ImageNet/raw",
"input_model": "resnet18",
"main_script": "main.py",
"batch_size": 20
}
}
}
Loading
Loading