# task | |
task_type: SchemaGuidedInstructBertTask | |
task_name: InstructBert_TagSpan_DebertaV3Base_ACE05ENPlus | |
comment: '~~content as label, (start, end + 1) span' | |
# data preprocessing | |
max_seq_len: 512 | |
debug_mode: false | |
label_span: tag # tag `[LM]` or content `person` | |
mode: span # w2 (1,2,3) or span (1,3) | |
# filepaths | |
plm_dir: microsoft/deberta-v3-base | |
# plm_dir: bert-base-cased | |
# data_dir: resources/Mirror/Tasks/EE/ACE05-EN | |
# data_dir: resources/Mirror/Tasks/RE/merged-20230502-2340-v1 | |
# data_dir: resources/Mirror/Tasks/RE/merged-20230502-2358-v2-woADE | |
# data_dir: resources/Mirror/Tasks/EE/ACE05-EN-labelmap | |
data_dir: resources/Mirror/v1.3/event/en/ACE05-EN-plus/fixed_instructed | |
output_dir: outputs | |
task_dir: ${output_dir}/${task_name} | |
# train_filepath: ${data_dir}/ACE2005_plus_train.jsonl | |
# dev_filepath: ${data_dir}/ACE2005_plus_dev.jsonl | |
# test_filepath: ${data_dir}/ACE2005_plus_test.jsonl | |
# train_filepath: ${data_dir}/ACE2005_oneie_NER_train.jsonl | |
# dev_filepath: ${data_dir}/ACE2005_oneie_NER_dev.jsonl | |
# test_filepath: ${data_dir}/ACE2005_oneie_NER_test.jsonl | |
# train_filepath: ${data_dir}/ACE2005_oneie_RE_train.jsonl | |
# dev_filepath: ${data_dir}/ACE2005_oneie_RE_dev.jsonl | |
# test_filepath: ${data_dir}/ACE2005_oneie_RE_test.jsonl | |
# train_filepath: ${data_dir}/ACE2005_oneie_EE_train.jsonl | |
# dev_filepath: ${data_dir}/ACE2005_oneie_EE_dev.jsonl | |
# test_filepath: ${data_dir}/ACE2005_oneie_EE_test.jsonl | |
# train_filepath: ${data_dir}/ACE2005_oneie_train.jsonl | |
# dev_filepath: ${data_dir}/ACE2005_oneie_dev.jsonl | |
# test_filepath: ${data_dir}/ACE2005_oneie_test.jsonl | |
# train_filepath: ${data_dir}/train.jsonl | |
# dev_filepath: ${data_dir}/dev.jsonl | |
# test_filepath: ${data_dir}/test.jsonl | |
train_filepath: ${data_dir}/train.jsonl | |
dev_filepath: ${data_dir}/dev.jsonl | |
test_filepath: ${data_dir}/test.jsonl | |
dump_cache_dir: ${task_dir}/cache | |
regenerate_cache: false | |
# training | |
random_seed: 1227 | |
eval_on_data: [dev, test] | |
select_best_on_data: dev | |
select_best_by_key: metric | |
best_metric_field: general_spans.micro.f1 | |
final_eval_on_test: true | |
save_every_ckpt: false | |
save_best_ckpt: true | |
warmup_proportion: 0.1 | |
num_epochs: 50 | |
epoch_patience: 5 | |
train_batch_size: 32 | |
eval_batch_size: 32 | |
learning_rate: !!float 3e-5 | |
other_learning_rate: !!float 3e-5 | |
max_grad_norm: 1.0 | |
weight_decay: 0.1 | |
# model | |
dropout: 0.3 | |
use_rope: true | |
biaffine_size: 512 | |