|
{ |
|
"backend": { |
|
"name": "pytorch", |
|
"version": "2.2.1+cu118", |
|
"_target_": "optimum_benchmark.backends.pytorch.backend.PyTorchBackend", |
|
"model": "gpt2", |
|
"task": "text-generation", |
|
"library": "transformers", |
|
"device": "cuda", |
|
"device_ids": "0", |
|
"seed": 42, |
|
"inter_op_num_threads": null, |
|
"intra_op_num_threads": null, |
|
"hub_kwargs": { |
|
"revision": "main", |
|
"force_download": false, |
|
"local_files_only": false, |
|
"trust_remote_code": false |
|
}, |
|
"no_weights": true, |
|
"device_map": null, |
|
"torch_dtype": null, |
|
"amp_autocast": false, |
|
"amp_dtype": null, |
|
"eval_mode": true, |
|
"to_bettertransformer": false, |
|
"low_cpu_mem_usage": null, |
|
"attn_implementation": null, |
|
"cache_implementation": null, |
|
"torch_compile": false, |
|
"torch_compile_config": {}, |
|
"quantization_scheme": null, |
|
"quantization_config": {}, |
|
"deepspeed_inference": false, |
|
"deepspeed_inference_config": {}, |
|
"peft_type": null, |
|
"peft_config": {} |
|
}, |
|
"launcher": { |
|
"name": "process", |
|
"_target_": "optimum_benchmark.launchers.process.launcher.ProcessLauncher", |
|
"device_isolation": false, |
|
"start_method": "spawn" |
|
}, |
|
"benchmark": { |
|
"name": "inference", |
|
"_target_": "optimum_benchmark.benchmarks.inference.benchmark.InferenceBenchmark", |
|
"duration": 10, |
|
"warmup_runs": 10, |
|
"input_shapes": { |
|
"batch_size": 2, |
|
"num_choices": 2, |
|
"sequence_length": 16 |
|
}, |
|
"new_tokens": null, |
|
"energy": false, |
|
"memory": false, |
|
"latency": true, |
|
"forward_kwargs": {}, |
|
"generate_kwargs": {}, |
|
"call_kwargs": {} |
|
}, |
|
"experiment_name": "test", |
|
"task": null, |
|
"model": null, |
|
"device": null, |
|
"library": null, |
|
"environment": { |
|
"cpu": " AMD EPYC 7742 64-Core Processor", |
|
"cpu_count": 128, |
|
"cpu_ram_mb": 540671.627264, |
|
"system": "Linux", |
|
"machine": "x86_64", |
|
"platform": "Linux-5.4.0-166-generic-x86_64-with-glibc2.35", |
|
"processor": "x86_64", |
|
"python_version": "3.10.12", |
|
"gpu": [ |
|
"NVIDIA A100-SXM4-80GB", |
|
"NVIDIA A100-SXM4-80GB", |
|
"NVIDIA A100-SXM4-80GB", |
|
"NVIDIA DGX Display", |
|
"NVIDIA A100-SXM4-80GB" |
|
], |

"gpu_count": 5, |

"gpu_vram_mb": 347892.350976, |
|
"optimum_benchmark_version": "0.2.0", |
|
"optimum_benchmark_commit": "99c4ad891865d24ebb865cc853e21127a1872efe", |
|
"transformers_version": "4.38.2", |
|
"transformers_commit": null, |
|
"accelerate_version": "0.27.2", |
|
"accelerate_commit": null, |
|
"diffusers_version": null, |
|
"diffusers_commit": null, |
|
"optimum_version": null, |
|
"optimum_commit": null, |
|
"timm_version": null, |
|
"timm_commit": null, |
|
"peft_version": null, |
|
"peft_commit": null |
|
} |
|
} |