Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
79 commits
Select commit Hold shift + click to select a range
2b648f1
added code in utils.py-docker
kobby-kobbs Jun 14, 2023
0a9be4b
created scripts and test file to run on CI
kobby-kobbs Jun 21, 2023
67cbb2d
Merge remote-tracking branch 'origin/main' into emmanuel/perf_monitoring
kobby-kobbs Jun 21, 2023
f1d0f63
fixed bug in Makefile
kobby-kobbs Jun 22, 2023
876329b
fixed bug in Makefile
kobby-kobbs Jun 22, 2023
94837c7
fixing bug in Makefile
kobby-kobbs Jun 22, 2023
ae8692f
fixing bug in Makefile
kobby-kobbs Jun 22, 2023
4c52adf
fixing bug in Makefile
kobby-kobbs Jun 22, 2023
3602c4e
changed search algorithm in json
kobby-kobbs Jun 24, 2023
6a8e79b
testing for best metrics on vm
kobby-kobbs Jun 28, 2023
6293ac4
w wrote script for extracting best model
kobby-kobbs Jun 29, 2023
13ba055
w wrote script for extracting best model
kobby-kobbs Jun 29, 2023
adecf5c
fixing error in CamemBERT test
kobby-kobbs Jul 6, 2023
fb26ff5
fixing error in CamemBERT test
kobby-kobbs Jul 6, 2023
0fd885b
updated camembert to use user_script
kobby-kobbs Jul 6, 2023
356634e
fixing error in text-classification models test
kobby-kobbs Jul 13, 2023
bc60753
pushing to test on pipeline
kobby-kobbs Jul 17, 2023
182862d
fixed script name error in makefile
kobby-kobbs Jul 17, 2023
ea7adb3
fixed script name error in makefile
kobby-kobbs Jul 17, 2023
5ad2066
fixed olive run error
kobby-kobbs Jul 17, 2023
e0f096d
testing 2 models
kobby-kobbs Jul 17, 2023
0ab5f57
testing bert model
kobby-kobbs Jul 17, 2023
bf366cf
fixing error on bert model
kobby-kobbs Jul 17, 2023
a1fa792
Merge branch 'main' into emmanuel/perf_monitoring
kobby-kobbs Jul 17, 2023
3baf699
making changes
kobby-kobbs Jul 17, 2023
4dffbf3
testing 5 models on pipeline
kobby-kobbs Jul 17, 2023
2aebc07
Merge branch 'main' into emmanuel/perf_monitoring
kobby-kobbs Jul 21, 2023
8306920
testing env variable on pipeline
kobby-kobbs Jul 21, 2023
215a134
testing env variable on pipeline
kobby-kobbs Jul 21, 2023
af855fc
testing env variable on pipeline
kobby-kobbs Jul 21, 2023
24da9bc
staging commits
kobby-kobbs Jul 24, 2023
88f9e2f
Merge branch 'main' into emmanuel/perf_monitoring
kobby-kobbs Jul 24, 2023
5cde016
expose data_files in hf load_dataset
jambayk Jul 24, 2023
210f709
add max_samples to huggingface data config
jambayk Jul 24, 2023
ff8ec9e
changes
kobby-kobbs Jul 24, 2023
415948c
Merge branch 'jambayk/update-hf-data' into emmanuel/perf_monitoring
kobby-kobbs Jul 25, 2023
86dbc28
changes
kobby-kobbs Jul 25, 2023
8f3f6ea
fixing merge conflict
kobby-kobbs Jul 25, 2023
e53ca5d
fixing merge conflict
kobby-kobbs Jul 25, 2023
680037f
fixing merge conflict
kobby-kobbs Jul 25, 2023
445f000
setting up env variable
kobby-kobbs Jul 26, 2023
8e7e21a
adding extra files
kobby-kobbs Jul 26, 2023
bd4dd28
adding extra files
kobby-kobbs Jul 26, 2023
f7dec68
adding extra files
kobby-kobbs Jul 27, 2023
812a264
adding extra files
kobby-kobbs Jul 27, 2023
754a889
cleaning up code
kobby-kobbs Jul 27, 2023
54d9b1a
cleaning up pipeline
kobby-kobbs Jul 27, 2023
4465d28
final changes made
kobby-kobbs Jul 27, 2023
c8716cd
final changes made
kobby-kobbs Jul 27, 2023
839eb50
final changes made
kobby-kobbs Jul 28, 2023
ae197be
made changes to models and metrics
kobby-kobbs Aug 4, 2023
7404da5
made changes to models tolerance
kobby-kobbs Aug 4, 2023
579325e
updated models search
kobby-kobbs Aug 4, 2023
9c05d3a
updated models and fixed error
kobby-kobbs Aug 4, 2023
db38fa8
updated models and fixed error
kobby-kobbs Aug 4, 2023
1fed3ae
updated samples for roberta
kobby-kobbs Aug 5, 2023
27a27cc
updated tolerance code
kobby-kobbs Aug 6, 2023
ae2683a
updated tolerance
kobby-kobbs Aug 6, 2023
1c775ce
updated toleranc
kobby-kobbs Aug 6, 2023
a26087b
updated utils
kobby-kobbs Aug 7, 2023
0d5cd97
updates made to utils
kobby-kobbs Aug 7, 2023
c3a890d
Merge branch 'main' into emmanuel/perf_monitoring
kobby-kobbs Aug 9, 2023
6e52648
merge main
xiaoyu-work Sep 26, 2023
56afa70
save
xiaoyu-work Sep 28, 2023
f573b9c
Merge branch 'main' of github.com:microsoft/Olive into emmanuel/perf_…
xiaoyu-work Sep 28, 2023
8eae2a6
rebase main
xiaoyu-work Oct 10, 2023
776add7
Merge branch 'main' of github.com:microsoft/Olive into emmanuel/perf_…
xiaoyu-work Oct 10, 2023
da35cbe
merge regression check pipeline to performance check pipeline
xiaoyu-work Oct 10, 2023
d9a40b3
update config
xiaoyu-work Oct 10, 2023
a1379cc
Update hf model map
xiaoyu-work Oct 10, 2023
b805264
update config
xiaoyu-work Oct 10, 2023
ed9a6f3
remove unused files
xiaoyu-work Oct 10, 2023
19a1e92
update comments
xiaoyu-work Oct 10, 2023
e81c8bf
remove deberta latency goal
xiaoyu-work Oct 10, 2023
9ae9387
update metric
xiaoyu-work Oct 11, 2023
843384b
update metric value
xiaoyu-work Oct 11, 2023
d376750
update log
xiaoyu-work Oct 11, 2023
432d4f5
update data for new cpu
xiaoyu-work Oct 11, 2023
9d489c2
Merge branch 'main' of https://github.com/microsoft/Olive into emmanu…
xiaoyu-work Oct 12, 2023
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
62 changes: 62 additions & 0 deletions .azure_pipelines/performance_check/best_metrics.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,62 @@
{
  "bert": {
    "cpu": {
      "accuracy-accuracy": 0.88,
      "latency-avg": {
        "8272CL": 15.5,
        "E5-2673": 44.5,
        "8171M": 20.89,
        "8370C": 18
      }
    },
    "gpu": {
      "accuracy-accuracy": 0.9,
      "latency-avg": 1.61
    }
  },
  "deberta": {
    "cpu": {
      "accuracy-accuracy": 0.84,
      "latency-avg": {
        "8272CL": 57.74,
        "E5-2673": 117.00,
        "8171M": 93.37,
        "8370C": 0
      }
    },
    "gpu": {
      "accuracy-accuracy": 0.88,
      "latency-avg": 8.011
    }
  },
  "distilbert": {
    "cpu": {
      "accuracy-accuracy": 0.94,
      "latency-avg": {
        "8272CL": 4.5,
        "E5-2673": 11.0,
        "8171M": 5.9,
        "8370C": 4.57
      }
    },
    "gpu": {
      "accuracy-accuracy": 0.94,
      "latency-avg": 0.91
    }
  },
  "roberta_large": {
    "cpu": {
      "accuracy-accuracy": 0.88,
      "latency-avg": {
        "8272CL": 52.38,
        "E5-2673": 140.34,
        "8171M": 69.33,
        "8370C": 0
      }
    },
    "gpu": {
      "accuracy-accuracy": 0.89,
      "latency-avg": 6.164
    }
  }
}
10 changes: 4 additions & 6 deletions .azure_pipelines/performance_check/configs/bert.json
Original file line number Diff line number Diff line change
Expand Up @@ -25,15 +25,13 @@
"type": "accuracy",
"backend": "huggingface_metrics",
"sub_types": [
{"name": "accuracy", "priority": 1, "goal": {"type": "max-degradation", "value": 0.01}}
]
{"name": "accuracy", "priority": 1, "goal": {"type": "max-degradation", "value": 0.05}} ]
},
{
"name": "latency",
"type": "latency",
"sub_types": [
{"name": "avg", "priority": 2, "goal": {"type": "percent-min-improvement", "value": 20}}
]
{"name": "avg", "priority": 2, "goal": {"type": "percent-min-improvement", "value": 5}} ]
}
]
}
Expand Down Expand Up @@ -81,7 +79,7 @@
"clean_cache": true,
"evaluator": "common_evaluator",
"execution_providers": ["CPUExecutionProvider"],
"cache_dir": "cache",
"output_dir" : "models/bert_ptq"
"cache_dir": "run_cache/olive/cache",
"output_dir" : "run_cache/olive/bert_ptq"
}
}
7 changes: 2 additions & 5 deletions .azure_pipelines/performance_check/configs/bert_gpu.json
Original file line number Diff line number Diff line change
Expand Up @@ -49,9 +49,6 @@
"type": "OrtTransformersOptimization",
"disable_search": true,
"config": {
"model_type": "bert",
"num_heads": 12,
"hidden_size": 768,
"float16": true
}
},
Expand Down Expand Up @@ -79,7 +76,7 @@
"evaluator": "common_evaluator",
"execution_providers": ["CUDAExecutionProvider"],
"clean_cache": true,
"cache_dir": "cache",
"output_dir" : "models/bert_gpu"
"cache_dir": "run_cache/olive/cache",
"output_dir" : "run_cache/olive/bert_gpu"
}
}
15 changes: 5 additions & 10 deletions .azure_pipelines/performance_check/configs/deberta.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@
"type": "accuracy",
"backend": "huggingface_metrics",
"sub_types": [
{"name": "accuracy", "priority": 1}
{"name": "accuracy", "priority": 1, "goal": {"type": "max-degradation", "value": 0.05}}

]
},
Expand All @@ -53,17 +53,12 @@
},
"transformers_optimization": {
"type": "OrtTransformersOptimization",
"disable_search": true,
"config": {
"model_type": "bert",
"num_heads": 12,
"hidden_size": 768,
"float16": false
}
"disable_search": true
},
"quantization": {
"type": "OnnxQuantization",
"config": {
"quant_mode": "dynamic",
"quant_preprocess": true,
"data_config": "__input_model_data_config__"
}
Expand All @@ -87,7 +82,7 @@
"clean_cache": true,
"evaluator": "common_evaluator",
"execution_providers": ["CPUExecutionProvider"],
"cache_dir": "cache",
"output_dir" : "models/microsoft-deberta"
"cache_dir": "run_cache/olive/cache",
"output_dir" : "run_cache/olive/microsoft-deberta"
}
}
11 changes: 4 additions & 7 deletions .azure_pipelines/performance_check/configs/deberta_gpu.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,15 +30,15 @@
"type": "accuracy",
"backend": "huggingface_metrics",
"sub_types": [
{"name": "accuracy", "priority": 1}
{"name": "accuracy", "priority": 1, "goal": {"type": "max-degradation", "value": 0.01}}

]
},
{
"name": "latency",
"type": "latency",
"sub_types": [
{"name": "avg", "priority": 2}
{"name": "avg", "priority": 2, "goal": {"type": "percent-min-improvement", "value": 20}}
]
}
]
Expand All @@ -55,9 +55,6 @@
"type": "OrtTransformersOptimization",
"disable_search": true,
"config": {
"model_type": "bert",
"num_heads": 12,
"hidden_size": 768,
"float16": true
}
},
Expand Down Expand Up @@ -85,7 +82,7 @@
"clean_cache": true,
"evaluator": "common_evaluator",
"execution_providers": ["CUDAExecutionProvider"],
"cache_dir": "cache",
"output_dir" : "models/microsoft-deberta_cuda"
"cache_dir": "run_cache/olive/cache",
"output_dir" : "run_cache/olive/microsoft-deberta_cuda"
}
}
17 changes: 6 additions & 11 deletions .azure_pipelines/performance_check/configs/distilbert.json
Original file line number Diff line number Diff line change
Expand Up @@ -26,14 +26,14 @@
"type": "accuracy",
"backend": "huggingface_metrics",
"sub_types": [
{"name": "accuracy", "priority": 1}
{"name": "accuracy", "priority": 1, "goal": {"type": "max-degradation", "value": 0.01}}
]
},
{
"name": "latency",
"type": "latency",
"sub_types": [
{"name": "avg", "priority": 2}
{"name": "avg", "priority": 2, "goal": {"type": "percent-min-improvement", "value": 20}}
]
}
]
Expand All @@ -48,13 +48,7 @@
},
"transformers_optimization": {
"type": "OrtTransformersOptimization",
"disable_search": true,
"config": {
"model_type": "bert",
"num_heads": 12,
"hidden_size": 768,
"float16": false
}
"disable_search": true
},
"quantization": {
"type": "OnnxQuantization",
Expand All @@ -79,10 +73,11 @@
"seed": 0
}
},
"log_severity_level": 0,
"clean_cache": true,
"evaluator": "common_evaluator",
"execution_providers": ["CPUExecutionProvider"],
"cache_dir": "cache",
"output_dir" : "models/distilbert"
"cache_dir": "run_cache/olive/cache",
"output_dir" : "run_cache/olive/distilbert"
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -49,9 +49,6 @@
"type": "OrtTransformersOptimization",
"disable_search": true,
"config": {
"model_type": "bert",
"num_heads": 12,
"hidden_size": 768,
"float16": true
}
},
Expand Down Expand Up @@ -79,7 +76,7 @@
"evaluator": "common_evaluator",
"execution_providers": ["CUDAExecutionProvider"],
"clean_cache": true,
"cache_dir": "cache",
"output_dir" : "models/distilbert_cuda"
"cache_dir": "run_cache/olive/cache",
"output_dir" : "run_cache/olive/distilbert_cuda"
}
}
12 changes: 3 additions & 9 deletions .azure_pipelines/performance_check/configs/roberta_large.json
Original file line number Diff line number Diff line change
Expand Up @@ -52,13 +52,7 @@
},
"transformers_optimization": {
"type": "OrtTransformersOptimization",
"disable_search": true,
"config": {
"model_type": "bert",
"num_heads": 12,
"hidden_size": 768,
"float16": false
}
"disable_search": true
},
"quantization": {
"type": "OnnxQuantization",
Expand Down Expand Up @@ -86,7 +80,7 @@
"clean_cache": true,
"evaluator": "common_evaluator",
"execution_providers": ["CPUExecutionProvider"],
"cache_dir": "cache",
"output_dir" : "models/roberta_large"
"cache_dir": "run_cache/olive/cache",
"output_dir" : "run_cache/olive/roberta_large"
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -54,9 +54,6 @@
"type": "OrtTransformersOptimization",
"disable_search": true,
"config": {
"model_type": "bert",
"num_heads": 12,
"hidden_size": 768,
"float16": true
}
},
Expand Down Expand Up @@ -84,7 +81,7 @@
"evaluator": "common_evaluator",
"execution_providers": ["CUDAExecutionProvider"],
"clean_cache": true,
"cache_dir": "cache",
"output_dir" : "models/roberta_large"
"cache_dir": "run_cache/olive/cache",
"output_dir" : "run_cache/olive/roberta_large"
}
}
Loading