[
    {
        "model_name_or_path": "elastic/distilbert-base-uncased-finetuned-conll03-english",
        "task": "token-classification",
        "dataset": {
            "path": "conll2003",
            "eval_split": "validation",
            "data_keys": {
                "primary": "tokens",
                "secondary": null
            },
            "ref_keys": [
                "ner_tags"
            ],
            "name": null,
            "calibration_split": "train"
        },
        "quantization_approach": "static",
        "operators_to_quantize": [
            "Add",
            "MatMul"
        ],
        "node_exclusion": [],
        "aware_training": false,
        "per_channel": false,
        "calibration": {
            "method": "minmax",
            "num_calibration_samples": 100,
            "calibration_histogram_percentile": null,
            "calibration_moving_average": null,
            "calibration_moving_average_constant": null
        },
        "framework": "onnxruntime",
        "framework_args": {
            "opset": 11,
            "optimization_level": 1
        },
        "hardware": "Architecture:                    x86_64\nCPU op-mode(s):                  32-bit, 64-bit\nByte Order:                      Little Endian\nAddress sizes:                   46 bits physical, 48 bits virtual\nCPU(s):                          8\nOn-line CPU(s) list:             0-7\nThread(s) per core:              2\nCore(s) per socket:              4\nSocket(s):                       1\nNUMA node(s):                    1\nVendor ID:                       GenuineIntel\nCPU family:                      6\nModel:                           85\nModel name:                      Intel(R) Xeon(R) Platinum 8259CL CPU @ 2.50GHz\nStepping:                        7\nCPU MHz:                         3100.244\nBogoMIPS:                        4999.99\nHypervisor vendor:               KVM\nVirtualization type:             full\nL1d cache:                       128 KiB\nL1i cache:                       128 KiB\nL2 cache:                        4 MiB\nL3 cache:                        35.8 MiB\nNUMA node0 CPU(s):               0-7\nVulnerability Itlb multihit:     KVM: Vulnerable\nVulnerability L1tf:              Mitigation; PTE Inversion\nVulnerability Mds:               Vulnerable: Clear CPU buffers attempted, no microcode; SMT Host state unknown\nVulnerability Meltdown:          Mitigation; PTI\nVulnerability Spec store bypass: Vulnerable\nVulnerability Spectre v1:        Mitigation; usercopy/swapgs barriers and __user pointer sanitization\nVulnerability Spectre v2:        Mitigation; Retpolines, STIBP disabled, RSB filling\nVulnerability Srbds:             Not affected\nVulnerability Tsx async abort:   Not affected\nFlags:                           fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ss ht syscall nx pdpe1gb rdtscp lm constant_tsc rep_good nopl xtopology nonstop_tsc cpuid aperfmperf tsc_known_freq pni pclmulqdq ssse3 fma cx16 pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand hypervisor lahf_lm abm 3dnowprefetch invpcid_single pti fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid mpx avx512f avx512dq rdseed adx smap clflushopt clwb avx512cd avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves ida arat pku ospke avx512_vnni\n",
        "versions": {
            "transformers": "4.20.1",
            "optimum": "1.2.3.dev0",
            "optimum_hash": "5ac9c0d9fd7e7cca55b2f9935b961ed5b6c50112"
        },
        "evaluation": {
            "time": [
                {
                    "batch_size": 4,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 25,
                        "throughput": 8.33,
                        "latency_mean": 120.23236996,
                        "latency_std": 0.989423927986037,
                        "latency_50": 120.445322,
                        "latency_90": 121.0641136,
                        "latency_95": 121.63786520000001,
                        "latency_99": 122.31954252,
                        "latency_999": 122.47620775200001
                    },
                    "optimized": {
                        "nb_forwards": 53,
                        "throughput": 17.67,
                        "latency_mean": 56.94031537735849,
                        "latency_std": 2.2044830948358625,
                        "latency_50": 56.199388,
                        "latency_90": 60.3284648,
                        "latency_95": 60.6057082,
                        "latency_99": 61.70255691999999,
                        "latency_999": 62.529690292000005
                    }
                },
                {
                    "batch_size": 8,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 19,
                        "throughput": 6.33,
                        "latency_mean": 166.53055257894738,
                        "latency_std": 1.575841987426849,
                        "latency_50": 166.638572,
                        "latency_90": 168.272883,
                        "latency_95": 168.7129504,
                        "latency_99": 169.52801488,
                        "latency_999": 169.711404388
                    },
                    "optimized": {
                        "nb_forwards": 24,
                        "throughput": 8.0,
                        "latency_mean": 129.002869375,
                        "latency_std": 0.6157854643813875,
                        "latency_50": 129.063924,
                        "latency_90": 129.7084936,
                        "latency_95": 129.9355643,
                        "latency_99": 130.24102448,
                        "latency_999": 130.313872748
                    }
                },
                {
                    "batch_size": 1,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 70,
                        "throughput": 23.33,
                        "latency_mean": 43.048573857142856,
                        "latency_std": 1.1204473128323003,
                        "latency_50": 42.845755,
                        "latency_90": 43.8944438,
                        "latency_95": 44.3052485,
                        "latency_99": 46.73122168000001,
                        "latency_999": 49.909082367999986
                    },
                    "optimized": {
                        "nb_forwards": 143,
                        "throughput": 47.67,
                        "latency_mean": 21.113699776223775,
                        "latency_std": 0.1930452254945551,
                        "latency_50": 21.085728,
                        "latency_90": 21.3874956,
                        "latency_95": 21.4500651,
                        "latency_99": 21.640094780000002,
                        "latency_999": 21.648399938
                    }
                }
            ],
            "others": {
                "baseline": {
                    "precision": 0.936836221352711,
                    "recall": 0.9533560864618885,
                    "f1": 0.9450239639131661,
                    "accuracy": 0.9880421708059153
                },
                "optimized": {
                    "precision": 0.07350512058143377,
                    "recall": 0.25312855517633676,
                    "f1": 0.1139272913466462,
                    "accuracy": 0.3629802589683719
                }
            }
        },
        "max_eval_samples": 1000,
        "time_benchmark_args": {
            "duration": 3,
            "warmup_runs": 1
        },
        "model_type": "distilbert"
    },
    {
        "model_name_or_path": "elastic/distilbert-base-uncased-finetuned-conll03-english",
        "task": "token-classification",
        "dataset": {
            "path": "conll2003",
            "eval_split": "validation",
            "data_keys": {
                "primary": "tokens",
                "secondary": null
            },
            "ref_keys": [
                "ner_tags"
            ],
            "name": null,
            "calibration_split": "train"
        },
        "quantization_approach": "static",
        "operators_to_quantize": [
            "Add"
        ],
        "node_exclusion": [],
        "aware_training": false,
        "per_channel": false,
        "calibration": {
            "method": "minmax",
            "num_calibration_samples": 100,
            "calibration_histogram_percentile": null,
            "calibration_moving_average": null,
            "calibration_moving_average_constant": null
        },
        "framework": "onnxruntime",
        "framework_args": {
            "opset": 11,
            "optimization_level": 1
        },
        "hardware": "Architecture:                    x86_64\nCPU op-mode(s):                  32-bit, 64-bit\nByte Order:                      Little Endian\nAddress sizes:                   46 bits physical, 48 bits virtual\nCPU(s):                          8\nOn-line CPU(s) list:             0-7\nThread(s) per core:              2\nCore(s) per socket:              4\nSocket(s):                       1\nNUMA node(s):                    1\nVendor ID:                       GenuineIntel\nCPU family:                      6\nModel:                           85\nModel name:                      Intel(R) Xeon(R) Platinum 8259CL CPU @ 2.50GHz\nStepping:                        7\nCPU MHz:                         3100.091\nBogoMIPS:                        4999.99\nHypervisor vendor:               KVM\nVirtualization type:             full\nL1d cache:                       128 KiB\nL1i cache:                       128 KiB\nL2 cache:                        4 MiB\nL3 cache:                        35.8 MiB\nNUMA node0 CPU(s):               0-7\nVulnerability Itlb multihit:     KVM: Vulnerable\nVulnerability L1tf:              Mitigation; PTE Inversion\nVulnerability Mds:               Vulnerable: Clear CPU buffers attempted, no microcode; SMT Host state unknown\nVulnerability Meltdown:          Mitigation; PTI\nVulnerability Spec store bypass: Vulnerable\nVulnerability Spectre v1:        Mitigation; usercopy/swapgs barriers and __user pointer sanitization\nVulnerability Spectre v2:        Mitigation; Retpolines, STIBP disabled, RSB filling\nVulnerability Srbds:             Not affected\nVulnerability Tsx async abort:   Not affected\nFlags:                           fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ss ht syscall nx pdpe1gb rdtscp lm constant_tsc rep_good nopl xtopology nonstop_tsc cpuid aperfmperf tsc_known_freq pni pclmulqdq ssse3 fma cx16 pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand hypervisor lahf_lm abm 3dnowprefetch invpcid_single pti fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid mpx avx512f avx512dq rdseed adx smap clflushopt clwb avx512cd avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves ida arat pku ospke avx512_vnni\n",
        "versions": {
            "transformers": "4.20.1",
            "optimum": "1.2.3.dev0",
            "optimum_hash": "5ac9c0d9fd7e7cca55b2f9935b961ed5b6c50112"
        },
        "evaluation": {
            "time": [
                {
                    "batch_size": 1,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 69,
                        "throughput": 23.0,
                        "latency_mean": 43.50449917391305,
                        "latency_std": 1.1458006326491226,
                        "latency_50": 43.443712,
                        "latency_90": 44.833304,
                        "latency_95": 45.4732784,
                        "latency_99": 46.1717674,
                        "latency_999": 46.293552340000005
                    },
                    "optimized": {
                        "nb_forwards": 80,
                        "throughput": 26.67,
                        "latency_mean": 37.9267952125,
                        "latency_std": 0.11734822683861629,
                        "latency_50": 37.9285515,
                        "latency_90": 38.085207600000004,
                        "latency_95": 38.111036399999996,
                        "latency_99": 38.2064807,
                        "latency_999": 38.22722057
                    }
                },
                {
                    "batch_size": 8,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 14,
                        "throughput": 4.67,
                        "latency_mean": 214.81155885714287,
                        "latency_std": 0.6229026122307055,
                        "latency_50": 214.6879675,
                        "latency_90": 215.571702,
                        "latency_95": 215.72494925,
                        "latency_99": 215.90999385,
                        "latency_999": 215.951628885
                    },
                    "optimized": {
                        "nb_forwards": 12,
                        "throughput": 4.0,
                        "latency_mean": 256.95122358333333,
                        "latency_std": 1.2773226309110695,
                        "latency_50": 257.0572985,
                        "latency_90": 258.7638351,
                        "latency_95": 258.84763195,
                        "latency_99": 258.86815838999996,
                        "latency_999": 258.872776839
                    }
                },
                {
                    "batch_size": 4,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 26,
                        "throughput": 8.67,
                        "latency_mean": 119.1024813076923,
                        "latency_std": 1.5917975126134987,
                        "latency_50": 118.759877,
                        "latency_90": 120.792844,
                        "latency_95": 121.9356475,
                        "latency_99": 123.13953675,
                        "latency_999": 123.40581367499999
                    },
                    "optimized": {
                        "nb_forwards": 23,
                        "throughput": 7.67,
                        "latency_mean": 130.78132304347827,
                        "latency_std": 0.5922745467393132,
                        "latency_50": 130.955147,
                        "latency_90": 131.512009,
                        "latency_95": 131.5393553,
                        "latency_99": 131.74930052,
                        "latency_999": 131.801985152
                    }
                }
            ],
            "others": {
                "baseline": {
                    "precision": 0.936836221352711,
                    "recall": 0.9533560864618885,
                    "f1": 0.9450239639131661,
                    "accuracy": 0.9880421708059153
                },
                "optimized": {
                    "precision": 0.06477812995245642,
                    "recall": 0.18600682593856654,
                    "f1": 0.09609168380840435,
                    "accuracy": 0.3400551899808958
                }
            }
        },
        "max_eval_samples": 1000,
        "time_benchmark_args": {
            "duration": 3,
            "warmup_runs": 1
        },
        "model_type": "distilbert"
    },
    {
        "model_name_or_path": "elastic/distilbert-base-uncased-finetuned-conll03-english",
        "task": "token-classification",
        "dataset": {
            "path": "conll2003",
            "eval_split": "validation",
            "data_keys": {
                "primary": "tokens",
                "secondary": null
            },
            "ref_keys": [
                "ner_tags"
            ],
            "name": null,
            "calibration_split": "train"
        },
        "quantization_approach": "dynamic",
        "operators_to_quantize": [
            "Add",
            "MatMul"
        ],
        "node_exclusion": [],
        "aware_training": false,
        "per_channel": false,
        "calibration": {
            "method": "minmax",
            "num_calibration_samples": 100,
            "calibration_histogram_percentile": null,
            "calibration_moving_average": null,
            "calibration_moving_average_constant": null
        },
        "framework": "onnxruntime",
        "framework_args": {
            "opset": 11,
            "optimization_level": 1
        },
        "hardware": "Architecture:                    x86_64\nCPU op-mode(s):                  32-bit, 64-bit\nByte Order:                      Little Endian\nAddress sizes:                   46 bits physical, 48 bits virtual\nCPU(s):                          8\nOn-line CPU(s) list:             0-7\nThread(s) per core:              2\nCore(s) per socket:              4\nSocket(s):                       1\nNUMA node(s):                    1\nVendor ID:                       GenuineIntel\nCPU family:                      6\nModel:                           85\nModel name:                      Intel(R) Xeon(R) Platinum 8259CL CPU @ 2.50GHz\nStepping:                        7\nCPU MHz:                         3100.009\nBogoMIPS:                        4999.99\nHypervisor vendor:               KVM\nVirtualization type:             full\nL1d cache:                       128 KiB\nL1i cache:                       128 KiB\nL2 cache:                        4 MiB\nL3 cache:                        35.8 MiB\nNUMA node0 CPU(s):               0-7\nVulnerability Itlb multihit:     KVM: Vulnerable\nVulnerability L1tf:              Mitigation; PTE Inversion\nVulnerability Mds:               Vulnerable: Clear CPU buffers attempted, no microcode; SMT Host state unknown\nVulnerability Meltdown:          Mitigation; PTI\nVulnerability Spec store bypass: Vulnerable\nVulnerability Spectre v1:        Mitigation; usercopy/swapgs barriers and __user pointer sanitization\nVulnerability Spectre v2:        Mitigation; Retpolines, STIBP disabled, RSB filling\nVulnerability Srbds:             Not affected\nVulnerability Tsx async abort:   Not affected\nFlags:                           fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ss ht syscall nx pdpe1gb rdtscp lm constant_tsc rep_good nopl xtopology nonstop_tsc cpuid aperfmperf tsc_known_freq pni pclmulqdq ssse3 fma cx16 pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand hypervisor lahf_lm abm 3dnowprefetch invpcid_single pti fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid mpx avx512f avx512dq rdseed adx smap clflushopt clwb avx512cd avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves ida arat pku ospke avx512_vnni\n",
        "versions": {
            "transformers": "4.20.1",
            "optimum": "1.2.3.dev0",
            "optimum_hash": "5ac9c0d9fd7e7cca55b2f9935b961ed5b6c50112"
        },
        "evaluation": {
            "time": [
                {
                    "batch_size": 1,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 53,
                        "throughput": 17.67,
                        "latency_mean": 57.63860111320755,
                        "latency_std": 0.5448611043553628,
                        "latency_50": 57.65361,
                        "latency_90": 58.180421,
                        "latency_95": 58.392744,
                        "latency_99": 58.71634352,
                        "latency_999": 58.721444252
                    },
                    "optimized": {
                        "nb_forwards": 244,
                        "throughput": 81.33,
                        "latency_mean": 12.298368512295083,
                        "latency_std": 0.4560740565346141,
                        "latency_50": 12.2116125,
                        "latency_90": 13.001667200000002,
                        "latency_95": 13.1330103,
                        "latency_99": 13.2790208,
                        "latency_999": 13.414312331
                    }
                },
                {
                    "batch_size": 4,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 26,
                        "throughput": 8.67,
                        "latency_mean": 119.50429169230769,
                        "latency_std": 0.4639465722921096,
                        "latency_50": 119.446385,
                        "latency_90": 119.95197,
                        "latency_95": 120.05153425,
                        "latency_99": 120.7893855,
                        "latency_999": 121.00299195000001
                    },
                    "optimized": {
                        "nb_forwards": 76,
                        "throughput": 25.33,
                        "latency_mean": 39.91599960526316,
                        "latency_std": 0.883213781232674,
                        "latency_50": 39.8835755,
                        "latency_90": 41.0755615,
                        "latency_95": 41.48617225,
                        "latency_99": 42.00973875,
                        "latency_999": 42.412953375
                    }
                },
                {
                    "batch_size": 8,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 19,
                        "throughput": 6.33,
                        "latency_mean": 165.83700805263157,
                        "latency_std": 1.7394953701654086,
                        "latency_50": 165.801757,
                        "latency_90": 168.0285054,
                        "latency_95": 168.19460990000002,
                        "latency_99": 168.78632678,
                        "latency_999": 168.919463078
                    },
                    "optimized": {
                        "nb_forwards": 40,
                        "throughput": 13.33,
                        "latency_mean": 75.448955425,
                        "latency_std": 1.2544431966810392,
                        "latency_50": 75.414968,
                        "latency_90": 77.1854282,
                        "latency_95": 77.5299735,
                        "latency_99": 77.80073465000001,
                        "latency_999": 77.95147686499999
                    }
                }
            ],
            "others": {
                "baseline": {
                    "precision": 0.936836221352711,
                    "recall": 0.9533560864618885,
                    "f1": 0.9450239639131661,
                    "accuracy": 0.9880421708059153
                },
                "optimized": {
                    "precision": 0.9368008948545862,
                    "recall": 0.9527872582480091,
                    "f1": 0.9447264523406655,
                    "accuracy": 0.9879006580343876
                }
            }
        },
        "max_eval_samples": 1000,
        "time_benchmark_args": {
            "duration": 3,
            "warmup_runs": 1
        },
        "model_type": "distilbert"
    },
    {
        "model_name_or_path": "elastic/distilbert-base-uncased-finetuned-conll03-english",
        "task": "token-classification",
        "dataset": {
            "path": "conll2003",
            "eval_split": "validation",
            "data_keys": {
                "primary": "tokens",
                "secondary": null
            },
            "ref_keys": [
                "ner_tags"
            ],
            "name": null,
            "calibration_split": "train"
        },
        "quantization_approach": "dynamic",
        "operators_to_quantize": [
            "Add"
        ],
        "node_exclusion": [],
        "aware_training": false,
        "per_channel": false,
        "calibration": {
            "method": "minmax",
            "num_calibration_samples": 100,
            "calibration_histogram_percentile": null,
            "calibration_moving_average": null,
            "calibration_moving_average_constant": null
        },
        "framework": "onnxruntime",
        "framework_args": {
            "opset": 11,
            "optimization_level": 1
        },
        "hardware": "Architecture:                    x86_64\nCPU op-mode(s):                  32-bit, 64-bit\nByte Order:                      Little Endian\nAddress sizes:                   46 bits physical, 48 bits virtual\nCPU(s):                          8\nOn-line CPU(s) list:             0-7\nThread(s) per core:              2\nCore(s) per socket:              4\nSocket(s):                       1\nNUMA node(s):                    1\nVendor ID:                       GenuineIntel\nCPU family:                      6\nModel:                           85\nModel name:                      Intel(R) Xeon(R) Platinum 8259CL CPU @ 2.50GHz\nStepping:                        7\nCPU MHz:                         2638.487\nBogoMIPS:                        4999.99\nHypervisor vendor:               KVM\nVirtualization type:             full\nL1d cache:                       128 KiB\nL1i cache:                       128 KiB\nL2 cache:                        4 MiB\nL3 cache:                        35.8 MiB\nNUMA node0 CPU(s):               0-7\nVulnerability Itlb multihit:     KVM: Vulnerable\nVulnerability L1tf:              Mitigation; PTE Inversion\nVulnerability Mds:               Vulnerable: Clear CPU buffers attempted, no microcode; SMT Host state unknown\nVulnerability Meltdown:          Mitigation; PTI\nVulnerability Spec store bypass: Vulnerable\nVulnerability Spectre v1:        Mitigation; usercopy/swapgs barriers and __user pointer sanitization\nVulnerability Spectre v2:        Mitigation; Retpolines, STIBP disabled, RSB filling\nVulnerability Srbds:             Not affected\nVulnerability Tsx async abort:   Not affected\nFlags:                           fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ss ht syscall nx pdpe1gb rdtscp lm constant_tsc rep_good nopl xtopology nonstop_tsc cpuid aperfmperf tsc_known_freq pni pclmulqdq ssse3 fma cx16 pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand hypervisor lahf_lm abm 3dnowprefetch invpcid_single pti fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid mpx avx512f avx512dq rdseed adx smap clflushopt clwb avx512cd avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves ida arat pku ospke avx512_vnni\n",
        "versions": {
            "transformers": "4.20.1",
            "optimum": "1.2.3.dev0",
            "optimum_hash": "5ac9c0d9fd7e7cca55b2f9935b961ed5b6c50112"
        },
        "evaluation": {
            "time": [
                {
                    "batch_size": 1,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 69,
                        "throughput": 23.0,
                        "latency_mean": 43.50526027536232,
                        "latency_std": 1.1770353674252074,
                        "latency_50": 43.267983,
                        "latency_90": 45.0357992,
                        "latency_95": 45.6057136,
                        "latency_99": 46.708998679999986,
                        "latency_999": 47.814713768000004
                    },
                    "optimized": {
                        "nb_forwards": 102,
                        "throughput": 34.0,
                        "latency_mean": 29.424613480392157,
                        "latency_std": 0.14890697595200564,
                        "latency_50": 29.3912705,
                        "latency_90": 29.646715,
                        "latency_95": 29.68545545,
                        "latency_99": 29.80756655,
                        "latency_999": 29.811399894
                    }
                },
                {
                    "batch_size": 4,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 26,
                        "throughput": 8.67,
                        "latency_mean": 119.6179461923077,
                        "latency_std": 1.4057848288153165,
                        "latency_50": 119.394914,
                        "latency_90": 121.3817145,
                        "latency_95": 121.8577975,
                        "latency_99": 122.802906,
                        "latency_999": 123.0513933
                    },
                    "optimized": {
                        "nb_forwards": 28,
                        "throughput": 9.33,
                        "latency_mean": 107.42320235714286,
                        "latency_std": 0.9405205161982765,
                        "latency_50": 107.1847235,
                        "latency_90": 107.6445599,
                        "latency_95": 108.2160214,
                        "latency_99": 111.05779109000001,
                        "latency_999": 111.916852709
                    }
                },
                {
                    "batch_size": 8,
                    "input_length": 64,
                    "baseline": {
                        "nb_forwards": 14,
                        "throughput": 4.67,
                        "latency_mean": 214.6487932857143,
                        "latency_std": 0.9053003539723654,
                        "latency_50": 214.552057,
                        "latency_90": 215.54495519999998,
                        "latency_95": 216.14476715,
                        "latency_99": 216.93365343000002,
                        "latency_999": 217.11115284299999
                    },
                    "optimized": {
                        "nb_forwards": 15,
                        "throughput": 5.0,
                        "latency_mean": 211.41319233333334,
                        "latency_std": 1.1447515204122778,
                        "latency_50": 211.02957,
                        "latency_90": 213.090243,
                        "latency_95": 213.19109559999998,
                        "latency_99": 213.37423912,
                        "latency_999": 213.415446412
                    }
                }
            ],
            "others": {
                "baseline": {
                    "precision": 0.936836221352711,
                    "recall": 0.9533560864618885,
                    "f1": 0.9450239639131661,
                    "accuracy": 0.9880421708059153
                },
                "optimized": {
                    "precision": 0.936836221352711,
                    "recall": 0.9533560864618885,
                    "f1": 0.9450239639131661,
                    "accuracy": 0.9880421708059153
                }
            }
        },
        "max_eval_samples": 1000,
        "time_benchmark_args": {
            "duration": 3,
            "warmup_runs": 1
        },
        "model_type": "distilbert"
    }
]