# Metadata block (presumably Hugging Face model-card front matter; confirm
# against the consuming tool). The bare `metadata` scalar that used to open
# this block is not valid before a mapping, so it survives only as this
# comment. Each key is defined exactly once: duplicate mapping keys are
# invalid in YAML 1.2 and most parsers silently keep only the last one.

# Datasets referenced by this entry.
datasets:
- jasperyeoh2/pairrm-preference-dataset
- GAIR/lima

# Base model reference.
base_model:
- mistralai/Mistral-7B-Instruct-v0.2

# Free-form tags.
tags:
- PEFT
- DPO