fxmarty's picture
add experience
7c7d8a4
[
{
"model_name_or_path": "elastic/distilbert-base-uncased-finetuned-conll03-english",
"task": "token-classification",
"task_args": null,
"dataset": {
"path": "conll2003",
"eval_split": "validation",
"data_keys": {
"primary": "tokens",
"secondary": null
},
"ref_keys": [
"ner_tags"
],
"name": null,
"calibration_split": "train"
},
"quantization_approach": "static",
"operators_to_quantize": [
"Add",
"MatMul"
],
"node_exclusion": [
"layernorm",
"gelu",
"residual",
"gather",
"softmax"
],
"aware_training": false,
"per_channel": false,
"calibration": {
"method": "minmax",
"num_calibration_samples": 100,
"calibration_histogram_percentile": null,
"calibration_moving_average": null,
"calibration_moving_average_constant": null
},
"framework": "onnxruntime",
"framework_args": {
"opset": 11,
"optimization_level": 1
},
"hardware": "Architecture: x86_64\nCPU op-mode(s): 32-bit, 64-bit\nByte Order: Little Endian\nAddress sizes: 46 bits physical, 48 bits virtual\nCPU(s): 8\nOn-line CPU(s) list: 0-7\nThread(s) per core: 2\nCore(s) per socket: 4\nSocket(s): 1\nNUMA node(s): 1\nVendor ID: GenuineIntel\nCPU family: 6\nModel: 85\nModel name: Intel(R) Xeon(R) Platinum 8259CL CPU @ 2.50GHz\nStepping: 7\nCPU MHz: 3099.967\nBogoMIPS: 4999.99\nHypervisor vendor: KVM\nVirtualization type: full\nL1d cache: 128 KiB\nL1i cache: 128 KiB\nL2 cache: 4 MiB\nL3 cache: 35.8 MiB\nNUMA node0 CPU(s): 0-7\nVulnerability Itlb multihit: KVM: Vulnerable\nVulnerability L1tf: Mitigation; PTE Inversion\nVulnerability Mds: Vulnerable: Clear CPU buffers attempted, no microcode; SMT Host state unknown\nVulnerability Meltdown: Mitigation; PTI\nVulnerability Spec store bypass: Vulnerable\nVulnerability Spectre v1: Mitigation; usercopy/swapgs barriers and __user pointer sanitization\nVulnerability Spectre v2: Mitigation; Retpolines, STIBP disabled, RSB filling\nVulnerability Srbds: Not affected\nVulnerability Tsx async abort: Not affected\nFlags: fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ss ht syscall nx pdpe1gb rdtscp lm constant_tsc rep_good nopl xtopology nonstop_tsc cpuid aperfmperf tsc_known_freq pni pclmulqdq ssse3 fma cx16 pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand hypervisor lahf_lm abm 3dnowprefetch invpcid_single pti fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid mpx avx512f avx512dq rdseed adx smap clflushopt clwb avx512cd avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves ida arat pku ospke avx512_vnni\n",
"versions": {
"transformers": "4.20.1",
"optimum": "1.2.3.dev0",
"optimum_hash": "5c9af4e5f93c7e9bd523563230732b49603dc4d7"
},
"evaluation": {
"time": [
{
"batch_size": 4,
"input_length": 64,
"baseline": {
"nb_forwards": 125,
"throughput": 8.33,
"latency_mean": 120.533118016,
"latency_std": 0.8359515558530887,
"latency_50": 120.363805,
"latency_90": 121.5990676,
"latency_95": 121.9226278,
"latency_99": 123.02248340000001,
"latency_999": 123.981240332
},
"optimized": {
"nb_forwards": 324,
"throughput": 21.6,
"latency_mean": 46.41411868827161,
"latency_std": 1.7434868124538356,
"latency_50": 46.258802,
"latency_90": 48.954860200000006,
"latency_95": 49.46207725,
"latency_99": 50.02644861,
"latency_999": 50.308738387000005
}
}
],
"others": {
"baseline": {
"precision": 0.9358012339503085,
"recall": 0.9444631437226523,
"f1": 0.9401122372057961,
"accuracy": 0.9882013940267124
},
"optimized": {
"precision": 0.9038969616908851,
"recall": 0.9212386401884888,
"f1": 0.912485414235706,
"accuracy": 0.9842295860753086
}
}
},
"max_eval_samples": null,
"time_benchmark_args": {
"duration": 15,
"warmup_runs": 5
},
"model_type": "distilbert"
},
{
"model_name_or_path": "elastic/distilbert-base-uncased-finetuned-conll03-english",
"task": "token-classification",
"task_args": null,
"dataset": {
"path": "conll2003",
"eval_split": "validation",
"data_keys": {
"primary": "tokens",
"secondary": null
},
"ref_keys": [
"ner_tags"
],
"name": null,
"calibration_split": "train"
},
"quantization_approach": "static",
"operators_to_quantize": [
"Add",
"MatMul"
],
"node_exclusion": [],
"aware_training": false,
"per_channel": false,
"calibration": {
"method": "minmax",
"num_calibration_samples": 100,
"calibration_histogram_percentile": null,
"calibration_moving_average": null,
"calibration_moving_average_constant": null
},
"framework": "onnxruntime",
"framework_args": {
"opset": 11,
"optimization_level": 1
},
"hardware": "Architecture: x86_64\nCPU op-mode(s): 32-bit, 64-bit\nByte Order: Little Endian\nAddress sizes: 46 bits physical, 48 bits virtual\nCPU(s): 8\nOn-line CPU(s) list: 0-7\nThread(s) per core: 2\nCore(s) per socket: 4\nSocket(s): 1\nNUMA node(s): 1\nVendor ID: GenuineIntel\nCPU family: 6\nModel: 85\nModel name: Intel(R) Xeon(R) Platinum 8259CL CPU @ 2.50GHz\nStepping: 7\nCPU MHz: 3100.910\nBogoMIPS: 4999.99\nHypervisor vendor: KVM\nVirtualization type: full\nL1d cache: 128 KiB\nL1i cache: 128 KiB\nL2 cache: 4 MiB\nL3 cache: 35.8 MiB\nNUMA node0 CPU(s): 0-7\nVulnerability Itlb multihit: KVM: Vulnerable\nVulnerability L1tf: Mitigation; PTE Inversion\nVulnerability Mds: Vulnerable: Clear CPU buffers attempted, no microcode; SMT Host state unknown\nVulnerability Meltdown: Mitigation; PTI\nVulnerability Spec store bypass: Vulnerable\nVulnerability Spectre v1: Mitigation; usercopy/swapgs barriers and __user pointer sanitization\nVulnerability Spectre v2: Mitigation; Retpolines, STIBP disabled, RSB filling\nVulnerability Srbds: Not affected\nVulnerability Tsx async abort: Not affected\nFlags: fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ss ht syscall nx pdpe1gb rdtscp lm constant_tsc rep_good nopl xtopology nonstop_tsc cpuid aperfmperf tsc_known_freq pni pclmulqdq ssse3 fma cx16 pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand hypervisor lahf_lm abm 3dnowprefetch invpcid_single pti fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid mpx avx512f avx512dq rdseed adx smap clflushopt clwb avx512cd avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves ida arat pku ospke avx512_vnni\n",
"versions": {
"transformers": "4.20.1",
"optimum": "1.2.3.dev0",
"optimum_hash": "5c9af4e5f93c7e9bd523563230732b49603dc4d7"
},
"evaluation": {
"time": [
{
"batch_size": 4,
"input_length": 64,
"baseline": {
"nb_forwards": 126,
"throughput": 8.4,
"latency_mean": 119.97364652380952,
"latency_std": 1.1115995809677575,
"latency_50": 119.8484215,
"latency_90": 121.1081755,
"latency_95": 121.99861425,
"latency_99": 122.6797695,
"latency_999": 124.28595525
},
"optimized": {
"nb_forwards": 253,
"throughput": 16.87,
"latency_mean": 59.49775931225296,
"latency_std": 3.518559570257517,
"latency_50": 58.504581,
"latency_90": 64.1940764,
"latency_95": 66.06759079999999,
"latency_99": 68.27611223999999,
"latency_999": 69.44462915599999
}
}
],
"others": {
"baseline": {
"precision": 0.9358012339503085,
"recall": 0.9444631437226523,
"f1": 0.9401122372057961,
"accuracy": 0.9882013940267124
},
"optimized": {
"precision": 0.06543578604398588,
"recall": 0.24335240659710536,
"f1": 0.10313837375178317,
"accuracy": 0.35697597445582335
}
}
},
"max_eval_samples": null,
"time_benchmark_args": {
"duration": 15,
"warmup_runs": 5
},
"model_type": "distilbert"
}
]