Spaces:

Spico
/

Mirror

Runtime error

App Files Files Community

Mirror / conf /mirror-ace05en.yaml

Spico

update

5953ef9 over 1 year ago

raw

history blame contribute delete

2.34 kB

	# task
	task_type: SchemaGuidedInstructBertTask
	task_name: InstructBert_TagSpan_DebertaV3Base_ACE05ENPlus
	comment: '~~content as label, (start, end + 1) span'

	# data preprocessing
	max_seq_len: 512
	debug_mode: false
	label_span: tag # tag `[LM]` or content `person`
	mode: span # w2 (1,2,3) or span (1,3)

	# filepaths
	plm_dir: microsoft/deberta-v3-base
	# plm_dir: bert-base-cased
	# data_dir: resources/Mirror/Tasks/EE/ACE05-EN
	# data_dir: resources/Mirror/Tasks/RE/merged-20230502-2340-v1
	# data_dir: resources/Mirror/Tasks/RE/merged-20230502-2358-v2-woADE
	# data_dir: resources/Mirror/Tasks/EE/ACE05-EN-labelmap
	data_dir: resources/Mirror/v1.3/event/en/ACE05-EN-plus/fixed_instructed
	output_dir: outputs
	task_dir: ${output_dir}/${task_name}
	# train_filepath: ${data_dir}/ACE2005_plus_train.jsonl
	# dev_filepath: ${data_dir}/ACE2005_plus_dev.jsonl
	# test_filepath: ${data_dir}/ACE2005_plus_test.jsonl
	# train_filepath: ${data_dir}/ACE2005_oneie_NER_train.jsonl
	# dev_filepath: ${data_dir}/ACE2005_oneie_NER_dev.jsonl
	# test_filepath: ${data_dir}/ACE2005_oneie_NER_test.jsonl
	# train_filepath: ${data_dir}/ACE2005_oneie_RE_train.jsonl
	# dev_filepath: ${data_dir}/ACE2005_oneie_RE_dev.jsonl
	# test_filepath: ${data_dir}/ACE2005_oneie_RE_test.jsonl
	# train_filepath: ${data_dir}/ACE2005_oneie_EE_train.jsonl
	# dev_filepath: ${data_dir}/ACE2005_oneie_EE_dev.jsonl
	# test_filepath: ${data_dir}/ACE2005_oneie_EE_test.jsonl
	# train_filepath: ${data_dir}/ACE2005_oneie_train.jsonl
	# dev_filepath: ${data_dir}/ACE2005_oneie_dev.jsonl
	# test_filepath: ${data_dir}/ACE2005_oneie_test.jsonl
	# train_filepath: ${data_dir}/train.jsonl
	# dev_filepath: ${data_dir}/dev.jsonl
	# test_filepath: ${data_dir}/test.jsonl
	train_filepath: ${data_dir}/train.jsonl
	dev_filepath: ${data_dir}/dev.jsonl
	test_filepath: ${data_dir}/test.jsonl

	dump_cache_dir: ${task_dir}/cache
	regenerate_cache: false

	# training
	random_seed: 1227
	eval_on_data: [dev, test]
	select_best_on_data: dev
	select_best_by_key: metric
	best_metric_field: general_spans.micro.f1
	final_eval_on_test: true
	save_every_ckpt: false
	save_best_ckpt: true

	warmup_proportion: 0.1
	num_epochs: 50
	epoch_patience: 5
	train_batch_size: 32
	eval_batch_size: 32
	learning_rate: !!float 3e-5
	other_learning_rate: !!float 3e-5
	max_grad_norm: 1.0
	weight_decay: 0.1

	# model
	dropout: 0.3
	use_rope: true
	biaffine_size: 512