{
  "model": {
    "model_name": "google-t5/t5-base",
    "max_input_length": 512,
    "max_target_length": 256,
    "vocab_size": 32128,
    "lora_r": 16,
    "lora_alpha": 32,
    "lora_dropout": 0.1,
    "target_modules": [
      "q",
      "v",
      "k",
      "o",
      "wi",
      "wo"
    ]
  },
  "training": {
    "output_dir": "./medical-qa-t5-lora",
    "num_train_epochs": 500,
    "per_device_train_batch_size": 8,
    "per_device_eval_batch_size": 16,
    "gradient_accumulation_steps": 4,
    "learning_rate": 0.0005,
    "weight_decay": 0.01,
    "warmup_steps": 500,
    "max_steps": -1,
    "eval_steps": 50,
    "save_steps": 100,
    "logging_steps": 50,
    "evaluation_strategy": "steps",
    "save_strategy": "steps",
    "fp16": true,
    "dataloader_num_workers": 4,
    "remove_unused_columns": false,
    "load_best_model_at_end": true,
    "metric_for_best_model": "eval_loss",
    "greater_is_better": false,
    "report_to": "tensorboard",
    "logging_dir": "./logs",
    "max_grad_norm": 1.0,
    "seed": 42
  },
  "data": {
    "dataset_name": "keivalya/MedQuad-MedicalQnADataset",
    "train_split": "train",
    "validation_split": "validation",
    "test_split": "test",
    "question_prefix": "medical question: ",
    "answer_prefix": "medical answer: ",
    "max_samples": null,
    "remove_special_chars": true,
    "lowercase": false,
    "strip_whitespace": true
  },
  "huggingface": {
    "hub_model_id": "Adilbai/medical-qa-t5-lora",
    "hub_token": null,
    "push_to_hub": true,
    "hub_private_repo": false,
    "save_base_model": true,
    "save_lora_adapter": true,
    "save_tokenizer": true,
    "save_config": true
  },
  "device": "cuda",
  "cache_dir": "./cache",
  "data_dir": "./data"
}