��:[�omegaconf.dictconfig�� DictConfig���)��}�(� _metadata��omegaconf.base��ContainerMetadata���)��}�(�ref_type��builtins��dict���� object_type�N�optional���key�N�flags�}��struct��s�resolver_cache�� collections�� defaultdict���h��R��key_type�N� element_type�Nub�_parent�N�_content�}�(�_name��omegaconf.nodes��AnyNode���)��}�(hh�Metadata���)��}�(h �typing��Any���hNh�hh h}�hhh��R�ubhh�_val�Nub�common�h)��}�(hh)��}�(h h,hNh�hh1h}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhh2h0Nub�no_progress_bar�h#)��}�(hh')��}�(h h,hNh�hhAh}�hhh��R�ubhh2h0�ub� log_interval�h#)��}�(hh')��}�(h h,hNh�hhIh}�hhh��R�ubhh2h0Kdub� log_format�h#)��}�(hh')��}�(h h,hNh�hhQh}�hhh��R�ubhh2h0Nub�log_file�h#)��}�(hh')��}�(h h,hNh�hhYh}�hhh��R�ubhh2h0Nub�aim_repo�h#)��}�(hh')��}�(h h,hNh�hhah}�hhh��R�ubhh2h0Nub� aim_run_hash�h#)��}�(hh')��}�(h h,hNh�hhih}�hhh��R�ubhh2h0Nub�tensorboard_logdir�h#)��}�(hh')��}�(h h,hNh�hhqh}�hhh��R�ubhh2h0Nub� wandb_project�h#)��}�(hh')��}�(h h,hNh�hhyh}�hhh��R�ubhh2h0Nub�azureml_logging�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0�ub�seed�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0Kub�cpu�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0�ub�tpu�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0�ub�bf16�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0�ub�memory_efficient_bf16�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0�ub�fp16�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0�ub�memory_efficient_fp16�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0�ub�fp16_no_flatten_grads�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0�ub�fp16_init_scale�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0K�ub�fp16_scale_window�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0Nub�fp16_scale_tolerance�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0Gub�on_cpu_convert_precision�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0�ub�min_loss_scale�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0G?6��C-ub�threshold_loss_scale�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0Nub�amp�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhh2h0�ub�amp_batch_retries�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhh2h0Kub�amp_init_scale�h#)��}�(hh')��}�(h h,hNh�hj h}�hhh��R�ubhh2h0K�ub�amp_scale_window�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhh2h0Nub�user_dir�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhh2h0�mcolt�ub�empty_cache_freq�h#)��}�(hh')��}�(h h,hNh�hj"h}�hhh��R�ubhh2h0Kub�all_gather_list_size�h#)��}�(hh')��}�(h h,hNh�hj*h}�hhh��R�ubhh2h0M@ub�model_parallel_size�h#)��}�(hh')��}�(h h,hNh�hj2h}�hhh��R�ubhh2h0Kub�quantization_config_path�h#)��}�(hh')��}�(h h,hNh�hj:h}�hhh��R�ubhh2h0Nub�profile�h#)��}�(hh')��}�(h h,hNh�hjBh}�hhh��R�ubhh2h0�ub� reset_logging�h#)��}�(hh')��}�(h h,hNh�hjJh}�hhh��R�ubhh2h0�ub�suppress_crashes�h#)��}�(hh')��}�(h h,hNh�hjRh}�hhh��R�ubhh2h0�ub�use_plasma_view�h#)��}�(hh')��}�(h h,hNh�hjZh}�hhh��R�ubhh2h0�ub� plasma_path�h#)��}�(hh')��}�(h h,hNh�hjbh}�hhh��R�ubhh2h0� /tmp/plasma�ubuub� common_eval�h)��}�(hh)��}�(h h,hNh�hjkh}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhjlh0Nub�path�h#)��}�(hh')��}�(h h,hNh�hj{h}�hhh��R�ubhjlh0�12e12d_last.pt�ub� post_process�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjlh0� subword_nmt�ub�quiet�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjlh0�ub�model_overrides�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjlh0�{}�ub� results_path�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjlh0Nubuub�distributed_training�h)��}�(hh)��}�(h h,hNh�hj�h}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj�h0Nub�distributed_world_size�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�distributed_num_procs�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�distributed_rank�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�distributed_backend�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�nccl�ub�distributed_init_method�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nub�distributed_port�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0J����ub� device_id�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�distributed_no_spawn�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub� ddp_backend�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0� pytorch_ddp�ub� ddp_comm_hook�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0�none�ub� bucket_cap_mb�h#)��}�(hh')��}�(h h,hNh�hj h}�hhh��R�ubhj�h0Kub�fix_batches_to_gpus�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0�ub�find_unused_parameters�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0�ub�gradient_as_bucket_view�h#)��}�(hh')��}�(h h,hNh�hj!h}�hhh��R�ubhj�h0�ub�fast_stat_sync�h#)��}�(hh')��}�(h h,hNh�hj)h}�hhh��R�ubhj�h0�ub�heartbeat_timeout�h#)��}�(hh')��}�(h h,hNh�hj1h}�hhh��R�ubhj�h0J����ub�broadcast_buffers�h#)��}�(hh')��}�(h h,hNh�hj9h}�hhh��R�ubhj�h0�ub�slowmo_momentum�h#)��}�(hh')��}�(h h,hNh�hjAh}�hhh��R�ubhj�h0Nub�slowmo_base_algorithm�h#)��}�(hh')��}�(h h,hNh�hjIh}�hhh��R�ubhj�h0�localsgd�ub�localsgd_frequency�h#)��}�(hh')��}�(h h,hNh�hjRh}�hhh��R�ubhj�h0Kub�nprocs_per_node�h#)��}�(hh')��}�(h h,hNh�hjZh}�hhh��R�ubhj�h0Kub�pipeline_model_parallel�h#)��}�(hh')��}�(h h,hNh�hjbh}�hhh��R�ubhj�h0�ub�pipeline_balance�h#)��}�(hh')��}�(h h,hNh�hjjh}�hhh��R�ubhj�h0Nub�pipeline_devices�h#)��}�(hh')��}�(h h,hNh�hjrh}�hhh��R�ubhj�h0Nub�pipeline_chunks�h#)��}�(hh')��}�(h h,hNh�hjzh}�hhh��R�ubhj�h0Kub�pipeline_encoder_balance�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nub�pipeline_encoder_devices�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nub�pipeline_decoder_balance�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nub�pipeline_decoder_devices�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nub�pipeline_checkpoint�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�never�ub� zero_sharding�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0jubh�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhj�h0�ubh�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhj�h0�ubh�h#)��}�(hh')��}�(h h,hNh�hh�h}�hhh��R�ubhj�h0�ub�no_reshard_after_forward�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�fp32_reduce_scatter�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub� cpu_offload�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�use_sharded_state�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�not_fsdp_flatten_parameters�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ubuub�dataset�h)��}�(hh)��}�(h h,hNh�hj�h}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj�h0Nub� num_workers�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0Kub�#skip_invalid_size_inputs_valid_test�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0�ub� max_tokens�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0Mub� batch_size�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0Nub�required_batch_size_multiple�h#)��}�(hh')��}�(h h,hNh�hj h}�hhh��R�ubhj�h0Kub�required_seq_len_multiple�h#)��}�(hh')��}�(h h,hNh�hj(h}�hhh��R�ubhj�h0Kub� dataset_impl�h#)��}�(hh')��}�(h h,hNh�hj0h}�hhh��R�ubhj�h0Nub�data_buffer_size�h#)��}�(hh')��}�(h h,hNh�hj8h}�hhh��R�ubhj�h0K ub� train_subset�h#)��}�(hh')��}�(h h,hNh�hj@h}�hhh��R�ubhj�h0�train�ub� valid_subset�h#)��}�(hh')��}�(h h,hNh�hjIh}�hhh��R�ubhj�h0�valid�ub�combine_valid_subsets�h#)��}�(hh')��}�(h h,hNh�hjRh}�hhh��R�ubhj�h0Nub�ignore_unused_valid_subsets�h#)��}�(hh')��}�(h h,hNh�hjZh}�hhh��R�ubhj�h0�ub�validate_interval�h#)��}�(hh')��}�(h h,hNh�hjbh}�hhh��R�ubhj�h0Kub�validate_interval_updates�h#)��}�(hh')��}�(h h,hNh�hjjh}�hhh��R�ubhj�h0Kub�validate_after_updates�h#)��}�(hh')��}�(h h,hNh�hjrh}�hhh��R�ubhj�h0Kub�fixed_validation_seed�h#)��}�(hh')��}�(h h,hNh�hjzh}�hhh��R�ubhj�h0Nub�disable_validation�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�max_tokens_valid�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Mub�batch_size_valid�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nub�max_valid_steps�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nub� curriculum�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub� gen_subset�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�test�ub� num_shards�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�shard_id�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�grouped_shuffling�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�update_epoch_batch_itr�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�update_ordered_indices_seed�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ubuub� optimization�h)��}�(hh)��}�(h h,hNh�hj�h}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj�h0Nub� max_epoch�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub� max_update�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�stop_time_hours�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Gub� clip_norm�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0Gub� sentence_avg�h#)��}�(hh')��}�(h h,hNh�hj h}�hhh��R�ubhj�h0�ub� update_freq��omegaconf.listconfig�� ListConfig���)��}�(hh)��}�(h h,hh �list���h�hjh}�hhh��R�hh �int���hNubhj�h]�h#)��}�(hh')��}�(h h,hNh�hKh}�hhh��R�ubhjh0Kubaub�lr�j)��}�(hh)��}�(h h,hjh�hj*h}�hhh��R�hj!hNubhj�h]�h#)��}�(hh')��}�(h h,hNh�hKh}�hhh��R�ubhj+h0G?�ubaub� stop_min_lr�h#)��}�(hh')��}�(h h,hNh�hj:h}�hhh��R�ubhj�h0G��ub�use_bmuf�h#)��}�(hh')��}�(h h,hNh�hjBh}�hhh��R�ubhj�h0�ub�skip_remainder_batch�h#)��}�(hh')��}�(h h,hNh�hjJh}�hhh��R�ubhj�h0�ub�debug_param_names�h#)��}�(hh')��}�(h h,hNh�hjRh}�hhh��R�ubhj�h0�ubuub� checkpoint�h)��}�(hh)��}�(h h,hNh�hjZh}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj[h0Nub�save_dir�h#)��}�(hh')��}�(h h,hNh�hjjh}�hhh��R�ubhj[h0� checkpoints�ub� restore_file�h#)��}�(hh')��}�(h h,hNh�hjsh}�hhh��R�ubhj[h0�checkpoint_last.pt�ub� continue_once�h#)��}�(hh')��}�(h h,hNh�hj|h}�hhh��R�ubhj[h0Nub�finetune_from_model�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0Nub�reset_dataloader�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0�ub�reset_lr_scheduler�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0�ub� reset_meters�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0�ub�reset_optimizer�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0�ub�optimizer_overrides�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0�{}�ub� save_interval�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0Kub�save_interval_updates�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0Kub�keep_interval_updates�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0J����ub�keep_interval_updates_pattern�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0J����ub�keep_last_epochs�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0J����ub�keep_best_checkpoints�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0J����ub�no_save�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0�ub�no_epoch_checkpoints�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0�ub�no_last_checkpoints�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0�ub�no_save_optimizer_state�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj[h0�ub�best_checkpoint_metric�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj[h0�loss�ub�maximize_best_checkpoint_metric�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj[h0�ub�patience�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj[h0J����ub�checkpoint_suffix�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj[h0��ub�checkpoint_shard_count�h#)��}�(hh')��}�(h h,hNh�hj'h}�hhh��R�ubhj[h0Kub�load_checkpoint_on_all_dp_ranks�h#)��}�(hh')��}�(h h,hNh�hj/h}�hhh��R�ubhj[h0�ub� write_checkpoints_asynchronously�h#)��}�(hh')��}�(h h,hNh�hj7h}�hhh��R�ubhj[h0�ubj2h#)��}�(hh')��}�(h h,hNh�hj2h}�hhh��R�ubhj[h0Kubuub�bmuf�h)��}�(hh)��}�(h h,hNh�hjFh}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhjGh0Nub�block_lr�h#)��}�(hh')��}�(h h,hNh�hjVh}�hhh��R�ubhjGh0G?�ub�block_momentum�h#)��}�(hh')��}�(h h,hNh�hj^h}�hhh��R�ubhjGh0G?�ub�global_sync_iter�h#)��}�(hh')��}�(h h,hNh�hjfh}�hhh��R�ubhjGh0K2ub�warmup_iterations�h#)��}�(hh')��}�(h h,hNh�hjnh}�hhh��R�ubhjGh0M�ub�use_nbm�h#)��}�(hh')��}�(h h,hNh�hjvh}�hhh��R�ubhjGh0�ub� average_sync�h#)��}�(hh')��}�(h h,hNh�hj~h}�hhh��R�ubhjGh0�ubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjGh0Kubuub� generation�h)��}�(hh)��}�(h h,hNh�hj�h}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj�h0Nub�beam�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�beam_mt�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�nbest�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub� max_len_a�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Gub� max_len_b�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0K�ub� max_len_a_mt�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Gub� max_len_b_mt�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0K�ub�min_len�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�match_source_len�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub� unnormalized�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub� no_early_stop�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�no_beamable_mm�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�lenpen�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0G?�ub� lenpen_mt�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0G?�ub�unkpen�h#)��}�(hh')��}�(h h,hNh�hj h}�hhh��R�ubhj�h0Gub� replace_unk�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0Nub� sacrebleu�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0�ub�score_reference�h#)��}�(hh')��}�(h h,hNh�hj%h}�hhh��R�ubhj�h0�ub� prefix_size�h#)��}�(hh')��}�(h h,hNh�hj-h}�hhh��R�ubhj�h0Kub�no_repeat_ngram_size�h#)��}�(hh')��}�(h h,hNh�hj5h}�hhh��R�ubhj�h0Kub�sampling�h#)��}�(hh')��}�(h h,hNh�hj=h}�hhh��R�ubhj�h0�ub� sampling_topk�h#)��}�(hh')��}�(h h,hNh�hjEh}�hhh��R�ubhj�h0J����ub� sampling_topp�h#)��}�(hh')��}�(h h,hNh�hjMh}�hhh��R�ubhj�h0G��ub� constraints�h#)��}�(hh')��}�(h h,hNh�hjUh}�hhh��R�ubhj�h0Nub� temperature�h#)��}�(hh')��}�(h h,hNh�hj]h}�hhh��R�ubhj�h0G?�ub�diverse_beam_groups�h#)��}�(hh')��}�(h h,hNh�hjeh}�hhh��R�ubhj�h0J����ub�diverse_beam_strength�h#)��}�(hh')��}�(h h,hNh�hjmh}�hhh��R�ubhj�h0G?�ub�diversity_rate�h#)��}�(hh')��}�(h h,hNh�hjuh}�hhh��R�ubhj�h0G��ub�print_alignment�h#)��}�(hh')��}�(h h,hNh�hj}h}�hhh��R�ubhj�h0Nub� print_step�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�lm_path�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nub� lm_weight�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Gub�iter_decode_eos_penalty�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Gub�iter_decode_max_iter�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0K ub�iter_decode_force_max_iter�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�iter_decode_with_beam�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kub�"iter_decode_with_external_reranker�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�retain_iter_history�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�retain_dropout�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub�retain_dropout_modules�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nub�decoding_format�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nub�no_seed_provided�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0�ub� eos_token�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nubuub�eval_lm�h)��}�(hh)��}�(h h,hNh�hj�h}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj�h0Nub�output_word_probs�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0�ub�output_word_stats�h#)��}�(hh')��}�(h h,hNh�hj h}�hhh��R�ubhj�h0�ub�context_window�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0Kub� softmax_batch�h#)��}�(hh')��}�(h h,hNh�hjh}�hhh��R�ubhj�h0��������ubuub� interactive�h)��}�(hh)��}�(h h,hNh�hj%h}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj&h0Nub� buffer_size�h#)��}�(hh')��}�(h h,hNh�hj5h}�hhh��R�ubhj&h0Kub�input�h#)��}�(hh')��}�(h h,hNh�hj=h}�hhh��R�ubhj&h0�input.en�ubuub�model�h#)��}�(hh')��}�(h h,hNh�hjFh}�hhh��R�ubhhh0Nub�task�h#)��}�(hh')��}�(h h,hNh�hjNh}�hhh��R�ubhhh0�argparse�� Namespace���)��}�(hA�hIKdhQNhYNhaNhiNhqNhyNh��h�Kh��h��h��h��h��h��h��h�K�h�Nh�Gh�h�G?6��C-h�Nh��jKj K�jNj�mcolt�j"Kj*M@j2Kj:NjB�jJ�jR�jZ�jb� /tmp/plasma�� criterion�� cross_entropy�� tokenizer��moses��bpe�� subword_nmt�� optimizer�N� lr_scheduler��fixed��scoring��bleu�jN�translation_w_langtok�jKj�jMjNj Kj(Kj0Nj8K j@�train�jI�valid�jRNjZ�jbKjjKjrKjzNj��j�Mj�Nj�Nj�Kj��test�j�Kj�Kj��j��j��j�Kj�Kj�Kj��nccl�j�Nj�J����j�Kj��j�j�jjj Kj�j�j!�j)�j1J����j9�jANjI�localsgd�jRKjZKjb�jjNjrNjzKj�Nj�Nj�Nj�Nj�j�j�jj��j��j��j��j��j{�12e12d_last.pt�j�� subword_nmt�j��j��{}�j�Nj�Kj�Kj�Kj�Kj�K�j�Kj�K�j�Kj��j��j��j��j�KjKj KjNj�j%�j-Kj5Kj=�jEJ����jMG��jUNj]G?�jeJ����jmG?�juG��j}Nj��j�Nj�Gj�Gj�K j��j�Kj��j��j��j�Nj�Nj��j�Njj� checkpoints�js�checkpoint_last.pt�j|Nj�Nj��j��j��j��j�jpj�Kj�Kj�J����j�J����j�J����j�J����j��j��j��j��j�loss�j�jJ����jj&j'Kj/�j7�j5Kj=�input.en��data�� ./data-bin�� source_lang��zh�� target_lang��en��load_alignments���left_pad_source��True��left_pad_target��False��max_source_positions�M�max_target_positions�M�upsample_primary�K�truncate_source���num_batch_buckets�K�lang_prefix_tok�� LANG_TOK_ES�� eval_bleu���eval_bleu_detok��space��eval_bleu_detok_args�N�eval_tokenized_bleu���eval_bleu_remove_bpe�N�eval_bleu_args�N�eval_bleu_print_samples���moses_no_dash_splits���moses_no_escape��� bpe_codes��codes.bpe.32000�� bpe_separator��@@�� force_anneal�N� lr_shrink�G?��������warmup_updates�K�pad�K�eos�K�unk�Kh jhububj]h)��}�(hh)��}�(h h,hNh�hj]h}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj�h0� cross_entropy�ubj h#)��}�(hh')��}�(h h,hNh�hj h}�hhh��R�ubhj�h0�ubuubjch#)��}�(hh')��}�(h h,hNh�hjch}�hhh��R�ubhhh0Nubjdh)��}�(hh)��}�(h h,hNh�hjdh}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj�h0�fixed�ubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Nubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0G?�������ubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kubj*j)��}�(hh)��}�(h h,hjh�hj*h}�hhh��R�hj!hNubhj�h]�h#)��}�(hh')��}�(h h,hNh�hKh}�hhh��R�ubhj�h0G?�ubaubuubjfh)��}�(hh)��}�(h h,hNh�hjfh}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj�h0�bleu�ubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj�h0Kubuubjah)��}�(hh)��}�(h h,hNh�hjah}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhjh0� subword_nmt�ubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjh0�codes.bpe.32000�ubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjh0�@@�ubuubj_h)��}�(hh)��}�(h h,hNh�hj_h}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhj2h0�moses�ubjwh#)��}�(hh')��}�(h h,hNh�hjwh}�hhh��R�ubhj2h0�zh�ubjyh#)��}�(hh')��}�(h h,hNh�hjyh}�hhh��R�ubhj2h0�en�ubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj2h0�ubj�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhj2h0�ubuub�ema�h)��}�(hh)��}�(h h,hNh�hj`h}�hhh��R�hNhNubhhh}�(h h#)��}�(hh')��}�(h h,hNh�hh h}�hhh��R�ubhjah0Nub� store_ema�h#)��}�(hh')��}�(h h,hNh�hjph}�hhh��R�ubhjah0�ub� ema_decay�h#)��}�(hh')��}�(h h,hNh�hjxh}�hhh��R�ubhjah0G?��.H�ub�ema_start_update�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjah0Kub�ema_seed_model�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjah0Nub�ema_update_freq�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjah0Kub�ema_fp32�h#)��}�(hh')��}�(h h,hNh�hj�h}�hhh��R�ubhjah0�ubuubuub.