vic_critP_20pr / benchmarks / experiment_config.json

Upload benchmarks/experiment_config.json with huggingface_hub

0649f57 verified about 1 year ago

3.55 kB

	{
	"backend": {
	"name": "pytorch",
	"version": "2.1.2",
	"_target_": "optimum_benchmark.backends.pytorch.backend.PyTorchBackend",
	"model": "LLMNewbie/vic_critP_20pr",
	"task": "text-generation",
	"library": "transformers",
	"device": "cuda",
	"device_ids": "0",
	"seed": 42,
	"inter_op_num_threads": null,
	"intra_op_num_threads": null,
	"hub_kwargs": {
	"revision": "main",
	"force_download": false,
	"local_files_only": false,
	"trust_remote_code": false
	},
	"no_weights": true,
	"device_map": null,
	"torch_dtype": null,
	"amp_autocast": false,
	"amp_dtype": null,
	"eval_mode": true,
	"to_bettertransformer": false,
	"low_cpu_mem_usage": null,
	"attn_implementation": null,
	"cache_implementation": null,
	"torch_compile": false,
	"torch_compile_config": {},
	"quantization_scheme": null,
	"quantization_config": {},
	"deepspeed_inference": false,
	"deepspeed_inference_config": {},
	"peft_type": null,
	"peft_config": {}
	},
	"launcher": {
	"name": "torchrun",
	"_target_": "optimum_benchmark.launchers.torchrun.launcher.TorchrunLauncher",
	"device_isolation": false,
	"min_nodes": 1,
	"max_nodes": 1,
	"nproc_per_node": 1,
	"role": "benchmark_worker",
	"monitor_interval": 30,
	"rdzv_id": "647201d3-1b63-4512-a68e-b5e519f515bf",
	"rdzv_backend": "c10d",
	"rdzv_endpoint": "localhost:0",
	"rdzv_configs": {
	"rank": 0,
	"timeout": 900
	},
	"max_restarts": 0,
	"start_method": "spawn",
	"log_dir": null,
	"redirects": "0",
	"tee": "0",
	"metrics_cfg": {},
	"local_addr": null
	},
	"benchmark": {
	"name": "inference",
	"_target_": "optimum_benchmark.benchmarks.inference.benchmark.InferenceBenchmark",
	"duration": 10,
	"warmup_runs": 10,
	"input_shapes": {
	"batch_size": 2,
	"num_choices": 2,
	"sequence_length": 16
	},
	"new_tokens": null,
	"latency": true,
	"memory": true,
	"energy": false,
	"forward_kwargs": {},
	"generate_kwargs": {},
	"call_kwargs": {}
	},
	"experiment_name": "api-launch",
	"task": null,
	"model": null,
	"device": null,
	"library": null,
	"environment": {
	"cpu": "Intel(R) Xeon(R) Gold 6448Y",
	"cpu_count": 16,
	"cpu_ram_mb": 237491.42528,
	"system": "Linux",
	"machine": "x86_64",
	"platform": "Linux-5.15.0-86-generic-x86_64-with-glibc2.35",
	"processor": "x86_64",
	"python_version": "3.10.12",
	"gpu": [
	"NVIDIA H100 80GB HBM3"
	],
	"gpu_count": 1,
	"gpu_vram_mb": 85520.809984,
	"optimum_benchmark_version": "0.2.0",
	"optimum_benchmark_commit": "9141f5b68a70cab5d9d5698b5bcefafd0c07270f",
	"transformers_version": "4.39.1",
	"transformers_commit": null,
	"accelerate_version": "0.25.0",
	"accelerate_commit": null,
	"diffusers_version": "0.15.0",
	"diffusers_commit": null,
	"optimum_version": "1.17.1",
	"optimum_commit": null,
	"timm_version": null,
	"timm_commit": null,
	"peft_version": "0.9.0",
	"peft_commit": null
	}
	}