add experience

Browse files

Files changed (5) hide show

README.md +59 -0
runs.json +196 -0
tensorboard/1657707611.2962544/events.out.tfevents.1657707611.ip-10-2-64-206.ec2.internal.1.1 +3 -0
tensorboard/1657707611.2976747/events.out.tfevents.1657707611.ip-10-2-64-206.ec2.internal.1.2 +3 -0
tensorboard/events.out.tfevents.1657707611.ip-10-2-64-206.ec2.internal.1.0 +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,59 @@

+---
+pipeline_tag: token-classification
+datasets:
+- conll2003
+metrics:
+- precision
+- recall
+- f1
+- accuracy
+tags:
+- distilbert
+---
+**Task:** `token-classification`
+**Backend:** `sagemaker-training`
+**Backend args:** `{'instance_type': 'ml.g4dn.2xlarge', 'supported_instructions': None}`
+**Number of evaluation samples:** `All dataset`
+Fixed parameters:
+* **model_name_or_path**: `elastic/distilbert-base-uncased-finetuned-conll03-english`
+* **dataset**:
+    * **path**: `conll2003`
+    * **eval_split**: `validation`
+    * **data_keys**: `{'primary': 'tokens'}`
+    * **ref_keys**: `['ner_tags']`
+    * **calibration_split**: `train`
+* **quantization_approach**: `static`
+* **operators_to_quantize**: `['Add', 'MatMul']`
+* **per_channel**: `False`
+* **calibration**:
+    * **method**: `minmax`
+    * **num_calibration_samples**: `100`
+* **framework**: `onnxruntime`
+* **framework_args**:
+    * **opset**: `11`
+    * **optimization_level**: `1`
+* **aware_training**: `False`
+Benchmarked parameters:
+* **node_exclusion**: `[]`,  `['layernorm', 'gelu', 'residual', 'gather', 'softmax']`
+# Evaluation
+## Non-time metrics
+|                      node_exclusion                      |     | precision (original) | precision (optimized) |     | recall (original) | recall (optimized) |     | f1 (original) | f1 (optimized) |     | accuracy (original) | accuracy (optimized) |
+| :------------------------------------------------------: | :-: | :------------------: | :-------------------: | :-: | :---------------: | :----------------: | :-: | :-----------: | :------------: | :-: | :-----------------: | :------------------: |
+| `['layernorm', 'gelu', 'residual', 'gather', 'softmax']` |  \|  |        0.936         |         0.904         |  \|  |       0.944       |       0.921        |  \|  |     0.940     |     0.912      |  \|  |        0.988        |        0.984         |
+|                           `[]`                           |  \|  |        0.936         |         0.065         |  \|  |       0.944       |       0.243        |  \|  |     0.940     |     0.103      |  \|  |        0.988        |        0.357         |
+## Time metrics
+Time benchmarks were run for 15 seconds per config.
+The time metrics below are for batch size = 4 and input length = 64.
+|                      node_exclusion                      |     | latency_mean (original, ms) | latency_mean (optimized, ms) |     | throughput (original, /s) | throughput (optimized, /s) |
+| :------------------------------------------------------: | :-: | :-------------------------: | :--------------------------: | :-: | :-----------------------: | :------------------------: |
+| `['layernorm', 'gelu', 'residual', 'gather', 'softmax']` |  \|  |           120.53            |            46.41             |  \|  |           8.33            |           21.60            |
+|                           `[]`                           |  \|  |           119.97            |            59.50             |  \|  |           8.40            |           16.87            |

runs.json ADDED Viewed

	@@ -0,0 +1,196 @@

+[
+    {
+        "model_name_or_path": "elastic/distilbert-base-uncased-finetuned-conll03-english",
+        "task": "token-classification",
+        "task_args": null,
+        "dataset": {
+            "path": "conll2003",
+            "eval_split": "validation",
+            "data_keys": {
+                "primary": "tokens",
+                "secondary": null
+            },
+            "ref_keys": [
+                "ner_tags"
+            ],
+            "name": null,
+            "calibration_split": "train"
+        },
+        "quantization_approach": "static",
+        "operators_to_quantize": [
+            "Add",
+            "MatMul"
+        ],
+        "node_exclusion": [
+            "layernorm",
+            "gelu",
+            "residual",
+            "gather",
+            "softmax"
+        ],
+        "aware_training": false,
+        "per_channel": false,
+        "calibration": {
+            "method": "minmax",
+            "num_calibration_samples": 100,
+            "calibration_histogram_percentile": null,
+            "calibration_moving_average": null,
+            "calibration_moving_average_constant": null
+        },
+        "framework": "onnxruntime",
+        "framework_args": {
+            "opset": 11,
+            "optimization_level": 1
+        },
+        "hardware": "Architecture:                    x86_64\nCPU op-mode(s):                  32-bit, 64-bit\nByte Order:                      Little Endian\nAddress sizes:                   46 bits physical, 48 bits virtual\nCPU(s):                          8\nOn-line CPU(s) list:             0-7\nThread(s) per core:              2\nCore(s) per socket:              4\nSocket(s):                       1\nNUMA node(s):                    1\nVendor ID:                       GenuineIntel\nCPU family:                      6\nModel:                           85\nModel name:                      Intel(R) Xeon(R) Platinum 8259CL CPU @ 2.50GHz\nStepping:                        7\nCPU MHz:                         3099.967\nBogoMIPS:                        4999.99\nHypervisor vendor:               KVM\nVirtualization type:             full\nL1d cache:                       128 KiB\nL1i cache:                       128 KiB\nL2 cache:                        4 MiB\nL3 cache:                        35.8 MiB\nNUMA node0 CPU(s):               0-7\nVulnerability Itlb multihit:     KVM: Vulnerable\nVulnerability L1tf:              Mitigation; PTE Inversion\nVulnerability Mds:               Vulnerable: Clear CPU buffers attempted, no microcode; SMT Host state unknown\nVulnerability Meltdown:          Mitigation; PTI\nVulnerability Spec store bypass: Vulnerable\nVulnerability Spectre v1:        Mitigation; usercopy/swapgs barriers and __user pointer sanitization\nVulnerability Spectre v2:        Mitigation; Retpolines, STIBP disabled, RSB filling\nVulnerability Srbds:             Not affected\nVulnerability Tsx async abort:   Not affected\nFlags:                           fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ss ht syscall nx pdpe1gb rdtscp lm constant_tsc rep_good nopl xtopology nonstop_tsc cpuid aperfmperf tsc_known_freq pni pclmulqdq ssse3 fma cx16 pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand hypervisor lahf_lm abm 3dnowprefetch invpcid_single pti fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid mpx avx512f avx512dq rdseed adx smap clflushopt clwb avx512cd avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves ida arat pku ospke avx512_vnni\n",
+        "versions": {
+            "transformers": "4.20.1",
+            "optimum": "1.2.3.dev0",
+            "optimum_hash": "5c9af4e5f93c7e9bd523563230732b49603dc4d7"
+        },
+        "evaluation": {
+            "time": [
+                {
+                    "batch_size": 4,
+                    "input_length": 64,
+                    "baseline": {
+                        "nb_forwards": 125,
+                        "throughput": 8.33,
+                        "latency_mean": 120.533118016,
+                        "latency_std": 0.8359515558530887,
+                        "latency_50": 120.363805,
+                        "latency_90": 121.5990676,
+                        "latency_95": 121.9226278,
+                        "latency_99": 123.02248340000001,
+                        "latency_999": 123.981240332
+                    },
+                    "optimized": {
+                        "nb_forwards": 324,
+                        "throughput": 21.6,
+                        "latency_mean": 46.41411868827161,
+                        "latency_std": 1.7434868124538356,
+                        "latency_50": 46.258802,
+                        "latency_90": 48.954860200000006,
+                        "latency_95": 49.46207725,
+                        "latency_99": 50.02644861,
+                        "latency_999": 50.308738387000005
+                    }
+                }
+            ],
+            "others": {
+                "baseline": {
+                    "precision": 0.9358012339503085,
+                    "recall": 0.9444631437226523,
+                    "f1": 0.9401122372057961,
+                    "accuracy": 0.9882013940267124
+                },
+                "optimized": {
+                    "precision": 0.9038969616908851,
+                    "recall": 0.9212386401884888,
+                    "f1": 0.912485414235706,
+                    "accuracy": 0.9842295860753086
+                }
+            }
+        },
+        "max_eval_samples": null,
+        "time_benchmark_args": {
+            "duration": 15,
+            "warmup_runs": 5
+        },
+        "model_type": "distilbert"
+    },
+    {
+        "model_name_or_path": "elastic/distilbert-base-uncased-finetuned-conll03-english",
+        "task": "token-classification",
+        "task_args": null,
+        "dataset": {
+            "path": "conll2003",
+            "eval_split": "validation",
+            "data_keys": {
+                "primary": "tokens",
+                "secondary": null
+            },
+            "ref_keys": [
+                "ner_tags"
+            ],
+            "name": null,
+            "calibration_split": "train"
+        },
+        "quantization_approach": "static",
+        "operators_to_quantize": [
+            "Add",
+            "MatMul"
+        ],
+        "node_exclusion": [],
+        "aware_training": false,
+        "per_channel": false,
+        "calibration": {
+            "method": "minmax",
+            "num_calibration_samples": 100,
+            "calibration_histogram_percentile": null,
+            "calibration_moving_average": null,
+            "calibration_moving_average_constant": null
+        },
+        "framework": "onnxruntime",
+        "framework_args": {
+            "opset": 11,
+            "optimization_level": 1
+        },
+        "hardware": "Architecture:                    x86_64\nCPU op-mode(s):                  32-bit, 64-bit\nByte Order:                      Little Endian\nAddress sizes:                   46 bits physical, 48 bits virtual\nCPU(s):                          8\nOn-line CPU(s) list:             0-7\nThread(s) per core:              2\nCore(s) per socket:              4\nSocket(s):                       1\nNUMA node(s):                    1\nVendor ID:                       GenuineIntel\nCPU family:                      6\nModel:                           85\nModel name:                      Intel(R) Xeon(R) Platinum 8259CL CPU @ 2.50GHz\nStepping:                        7\nCPU MHz:                         3100.910\nBogoMIPS:                        4999.99\nHypervisor vendor:               KVM\nVirtualization type:             full\nL1d cache:                       128 KiB\nL1i cache:                       128 KiB\nL2 cache:                        4 MiB\nL3 cache:                        35.8 MiB\nNUMA node0 CPU(s):               0-7\nVulnerability Itlb multihit:     KVM: Vulnerable\nVulnerability L1tf:              Mitigation; PTE Inversion\nVulnerability Mds:               Vulnerable: Clear CPU buffers attempted, no microcode; SMT Host state unknown\nVulnerability Meltdown:          Mitigation; PTI\nVulnerability Spec store bypass: Vulnerable\nVulnerability Spectre v1:        Mitigation; usercopy/swapgs barriers and __user pointer sanitization\nVulnerability Spectre v2:        Mitigation; Retpolines, STIBP disabled, RSB filling\nVulnerability Srbds:             Not affected\nVulnerability Tsx async abort:   Not affected\nFlags:                           fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ss ht syscall nx pdpe1gb rdtscp lm constant_tsc rep_good nopl xtopology nonstop_tsc cpuid aperfmperf tsc_known_freq pni pclmulqdq ssse3 fma cx16 pcid sse4_1 sse4_2 x2apic movbe popcnt tsc_deadline_timer aes xsave avx f16c rdrand hypervisor lahf_lm abm 3dnowprefetch invpcid_single pti fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid mpx avx512f avx512dq rdseed adx smap clflushopt clwb avx512cd avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves ida arat pku ospke avx512_vnni\n",
+        "versions": {
+            "transformers": "4.20.1",
+            "optimum": "1.2.3.dev0",
+            "optimum_hash": "5c9af4e5f93c7e9bd523563230732b49603dc4d7"
+        },
+        "evaluation": {
+            "time": [
+                {
+                    "batch_size": 4,
+                    "input_length": 64,
+                    "baseline": {
+                        "nb_forwards": 126,
+                        "throughput": 8.4,
+                        "latency_mean": 119.97364652380952,
+                        "latency_std": 1.1115995809677575,
+                        "latency_50": 119.8484215,
+                        "latency_90": 121.1081755,
+                        "latency_95": 121.99861425,
+                        "latency_99": 122.6797695,
+                        "latency_999": 124.28595525
+                    },
+                    "optimized": {
+                        "nb_forwards": 253,
+                        "throughput": 16.87,
+                        "latency_mean": 59.49775931225296,
+                        "latency_std": 3.518559570257517,
+                        "latency_50": 58.504581,
+                        "latency_90": 64.1940764,
+                        "latency_95": 66.06759079999999,
+                        "latency_99": 68.27611223999999,
+                        "latency_999": 69.44462915599999
+                    }
+                }
+            ],
+            "others": {
+                "baseline": {
+                    "precision": 0.9358012339503085,
+                    "recall": 0.9444631437226523,
+                    "f1": 0.9401122372057961,
+                    "accuracy": 0.9882013940267124
+                },
+                "optimized": {
+                    "precision": 0.06543578604398588,
+                    "recall": 0.24335240659710536,
+                    "f1": 0.10313837375178317,
+                    "accuracy": 0.35697597445582335
+                }
+            }
+        },
+        "max_eval_samples": null,
+        "time_benchmark_args": {
+            "duration": 15,
+            "warmup_runs": 5
+        },
+        "model_type": "distilbert"
+    }
+]

tensorboard/1657707611.2962544/events.out.tfevents.1657707611.ip-10-2-64-206.ec2.internal.1.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ce86125e8a636be39bff10bff27849d2a71abd354b6c809d87f862403119453
+size 696

tensorboard/1657707611.2976747/events.out.tfevents.1657707611.ip-10-2-64-206.ec2.internal.1.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:38bb5da1b600d8842d3d85a2b2104775dd0f3b1beddbfd60fe8de0f5c5522440
+size 644

tensorboard/events.out.tfevents.1657707611.ip-10-2-64-206.ec2.internal.1.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5315e44ede4671066360385cecf9da4cae04e4f04d0d27849665f6a042e0969d
+size 40