vic_critP_20pr / benchmarks /experiment_config.json
LLMnewbie's picture
Upload benchmarks/experiment_config.json with huggingface_hub
0649f57 verified
{
"backend": {
"name": "pytorch",
"version": "2.1.2",
"_target_": "optimum_benchmark.backends.pytorch.backend.PyTorchBackend",
"model": "LLMNewbie/vic_critP_20pr",
"task": "text-generation",
"library": "transformers",
"device": "cuda",
"device_ids": "0",
"seed": 42,
"inter_op_num_threads": null,
"intra_op_num_threads": null,
"hub_kwargs": {
"revision": "main",
"force_download": false,
"local_files_only": false,
"trust_remote_code": false
},
"no_weights": true,
"device_map": null,
"torch_dtype": null,
"amp_autocast": false,
"amp_dtype": null,
"eval_mode": true,
"to_bettertransformer": false,
"low_cpu_mem_usage": null,
"attn_implementation": null,
"cache_implementation": null,
"torch_compile": false,
"torch_compile_config": {},
"quantization_scheme": null,
"quantization_config": {},
"deepspeed_inference": false,
"deepspeed_inference_config": {},
"peft_type": null,
"peft_config": {}
},
"launcher": {
"name": "torchrun",
"_target_": "optimum_benchmark.launchers.torchrun.launcher.TorchrunLauncher",
"device_isolation": false,
"min_nodes": 1,
"max_nodes": 1,
"nproc_per_node": 1,
"role": "benchmark_worker",
"monitor_interval": 30,
"rdzv_id": "647201d3-1b63-4512-a68e-b5e519f515bf",
"rdzv_backend": "c10d",
"rdzv_endpoint": "localhost:0",
"rdzv_configs": {
"rank": 0,
"timeout": 900
},
"max_restarts": 0,
"start_method": "spawn",
"log_dir": null,
"redirects": "0",
"tee": "0",
"metrics_cfg": {},
"local_addr": null
},
"benchmark": {
"name": "inference",
"_target_": "optimum_benchmark.benchmarks.inference.benchmark.InferenceBenchmark",
"duration": 10,
"warmup_runs": 10,
"input_shapes": {
"batch_size": 2,
"num_choices": 2,
"sequence_length": 16
},
"new_tokens": null,
"latency": true,
"memory": true,
"energy": false,
"forward_kwargs": {},
"generate_kwargs": {},
"call_kwargs": {}
},
"experiment_name": "api-launch",
"task": null,
"model": null,
"device": null,
"library": null,
"environment": {
"cpu": "Intel(R) Xeon(R) Gold 6448Y",
"cpu_count": 16,
"cpu_ram_mb": 237491.42528,
"system": "Linux",
"machine": "x86_64",
"platform": "Linux-5.15.0-86-generic-x86_64-with-glibc2.35",
"processor": "x86_64",
"python_version": "3.10.12",
"gpu": [
"NVIDIA H100 80GB HBM3"
],
"gpu_count": 1,
"gpu_vram_mb": 85520.809984,
"optimum_benchmark_version": "0.2.0",
"optimum_benchmark_commit": "9141f5b68a70cab5d9d5698b5bcefafd0c07270f",
"transformers_version": "4.39.1",
"transformers_commit": null,
"accelerate_version": "0.25.0",
"accelerate_commit": null,
"diffusers_version": "0.15.0",
"diffusers_commit": null,
"optimum_version": "1.17.1",
"optimum_commit": null,
"timm_version": null,
"timm_commit": null,
"peft_version": "0.9.0",
"peft_commit": null
}
}