kushal-tri
/

sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_

kushal-tri committed on Nov 13, 2024

Commit

72cc66a

verified ·

1 Parent(s): 88fe4a9

Training in progress, epoch 0

Browse files

Files changed (27) hide show

.gitattributes +1 -0
added_tokens.json +30 -0
config.json +29 -0
merges.txt +0 -0
model-00001-of-00004.safetensors +3 -0
model-00002-of-00004.safetensors +3 -0
model-00003-of-00004.safetensors +3 -0
model-00004-of-00004.safetensors +3 -0
model.safetensors.index.json +346 -0
special_tokens_map.json +60 -0
tokenizer.json +3 -0
tokenizer_config.json +248 -0
training_args.bin +3 -0
vocab.json +0 -0
wandb/debug-internal.log +373 -0
wandb/debug.log +30 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/code/qlearning_reasoning/training/sft.py +249 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/conda-environment.yaml +515 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/config.yaml +948 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/diff.patch +49 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log +0 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/requirements.txt +289 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-metadata.json +1069 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json +1 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/logs/debug-internal.log +373 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/logs/debug.log +30 -0
wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/run-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1.wandb +0 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

added_tokens.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+  "</tool_call>": 151658,
+  "<tool_call>": 151657,
+  "<|box_end|>": 151649,
+  "<|box_start|>": 151648,
+  "<|endoftext|>": 151643,
+  "<|file_sep|>": 151664,
+  "<|fim_middle|>": 151660,
+  "<|fim_pad|>": 151662,
+  "<|fim_prefix|>": 151659,
+  "<|fim_suffix|>": 151661,
+  "<|im_end|>": 151645,
+  "<|im_start|>": 151644,
+  "<|image_pad|>": 151655,
+  "<|object_ref_end|>": 151647,
+  "<|object_ref_start|>": 151646,
+  "<|quad_end|>": 151651,
+  "<|quad_start|>": 151650,
+  "<|repo_name|>": 151663,
+  "<|video_pad|>": 151656,
+  "<|vision_end|>": 151653,
+  "<|vision_pad|>": 151654,
+  "<|vision_start|>": 151652,
+  "[/REVISION]": 151670,
+  "[/STEP]": 151666,
+  "[/TURN]": 151668,
+  "[REVISION]": 151669,
+  "[STEP]": 151665,
+  "[TURN]": 151667
+}

config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "_name_or_path": "Qwen/Qwen2.5-Coder-7B-Instruct",
+  "architectures": [
+    "Qwen2ForCausalLM"
+  ],
+  "attention_dropout": 0.0,
+  "eos_token_id": 151645,
+  "hidden_act": "silu",
+  "hidden_size": 3584,
+  "initializer_range": 0.02,
+  "intermediate_size": 18944,
+  "max_position_embeddings": 32768,
+  "max_window_layers": 28,
+  "model_type": "qwen2",
+  "num_attention_heads": 28,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 4,
+  "pad_token_id": 151643,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": null,
+  "rope_theta": 1000000.0,
+  "sliding_window": null,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.46.0",
+  "use_cache": false,
+  "use_sliding_window": false,
+  "vocab_size": 151671
+}

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

model-00001-of-00004.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5248e85868cfadf673f21aff3553bda95fc725be514fcb518f8605431cda1370
+size 4874843752

model-00002-of-00004.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:adaaf154d498e47b508bd058351d88fae666bd6923ef97752791cecf35f1a5ad
+size 4932751008

model-00003-of-00004.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:deaded19ac2798595b85aa83a5b121de1ccb598159e52f793d41caeb5ee6bee0
+size 4330865200

model-00004-of-00004.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:813e96187ef9e2dec23fdf90b62ac1ae750a434b9a0e73cd0847ce4b79035f8a
+size 1087177856

model.safetensors.index.json ADDED Viewed

	@@ -0,0 +1,346 @@

+{
+  "metadata": {
+    "total_size": 15225598976
+  },
+  "weight_map": {
+    "lm_head.weight": "model-00004-of-00004.safetensors",
+    "model.embed_tokens.weight": "model-00001-of-00004.safetensors",
+    "model.layers.0.input_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.0.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.0.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.1.input_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.1.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.1.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.1.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.1.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.1.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.10.input_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.10.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.10.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.10.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.10.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.10.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.10.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.10.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.10.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.10.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.10.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.10.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.11.input_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.11.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.11.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.11.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.11.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.11.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.11.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.11.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.11.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.11.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.11.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.11.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.12.input_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.12.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.12.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.12.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.12.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.12.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.12.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.12.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.12.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.12.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.12.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.12.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.13.input_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.13.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.13.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.13.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.13.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.13.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.13.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.13.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.13.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.13.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.13.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.13.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.14.input_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.14.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.14.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.14.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.14.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.14.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.14.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.14.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.14.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.14.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.14.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.14.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.15.input_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.15.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.15.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.15.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.15.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.15.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.15.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.15.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.15.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.15.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.15.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.16.input_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.16.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.16.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.16.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.16.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.16.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.16.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.16.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.16.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.16.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.16.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.16.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.17.input_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.17.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.17.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.17.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.17.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.17.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.17.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.17.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.17.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.17.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.17.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.17.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.18.input_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.18.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.18.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.18.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.18.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.18.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.18.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.18.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.18.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.18.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.18.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.18.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.19.input_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.19.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.19.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.19.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.19.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.19.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.19.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.19.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.19.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.19.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.19.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.19.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.2.input_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.2.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.2.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.2.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.2.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.2.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.20.input_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.20.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.20.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.20.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.20.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.20.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.20.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.20.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.20.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.20.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.20.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.20.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.21.input_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.21.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.21.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.21.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.21.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.21.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.21.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.21.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.21.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.21.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.21.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.21.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.22.input_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.22.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.22.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.22.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.22.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.22.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.22.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.22.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.22.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.22.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.22.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.22.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.23.input_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.23.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.23.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.23.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.23.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.23.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.23.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.23.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.23.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.23.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.23.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.23.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.24.input_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.24.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.24.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.24.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.24.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.24.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.24.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.24.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.24.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.24.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.24.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.25.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.25.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.25.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.25.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.25.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.25.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.25.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.25.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.25.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.26.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.26.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.26.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.26.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.26.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.26.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.26.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.26.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.26.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.27.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.27.mlp.gate_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.27.mlp.up_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.27.post_attention_layernorm.weight": "model-00003-of-00004.safetensors",
+    "model.layers.27.self_attn.k_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.27.self_attn.k_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.27.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.27.self_attn.q_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.27.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.27.self_attn.v_proj.bias": "model-00003-of-00004.safetensors",
+    "model.layers.27.self_attn.v_proj.weight": "model-00003-of-00004.safetensors",
+    "model.layers.3.input_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.3.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.3.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.3.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.3.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.3.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.4.input_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.4.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.4.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.4.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.4.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.4.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.5.input_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.5.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.5.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.5.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.5.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.5.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.6.input_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.6.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.6.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.6.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.6.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.6.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.7.input_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.7.mlp.down_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.7.mlp.gate_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.7.mlp.up_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.7.post_attention_layernorm.weight": "model-00001-of-00004.safetensors",
+    "model.layers.7.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.7.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.7.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.8.input_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.8.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.8.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.8.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.8.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.8.self_attn.k_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.8.self_attn.q_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.8.self_attn.v_proj.bias": "model-00001-of-00004.safetensors",
+    "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00004.safetensors",
+    "model.layers.9.input_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.9.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.9.mlp.gate_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.9.mlp.up_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.9.post_attention_layernorm.weight": "model-00002-of-00004.safetensors",
+    "model.layers.9.self_attn.k_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.9.self_attn.k_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.9.self_attn.o_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.9.self_attn.q_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.9.self_attn.q_proj.weight": "model-00002-of-00004.safetensors",
+    "model.layers.9.self_attn.v_proj.bias": "model-00002-of-00004.safetensors",
+    "model.layers.9.self_attn.v_proj.weight": "model-00002-of-00004.safetensors",
+    "model.norm.weight": "model-00003-of-00004.safetensors"
+  }
+}

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,60 @@

+{
+  "additional_special_tokens": [
+    {
+      "content": "[STEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "[/STEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "[TURN]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "[/TURN]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "[REVISION]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "[/REVISION]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    }
+  ],
+  "eos_token": {
+    "content": "<|im_end|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:119474abe8593f47402f00c90e22eac0436e64f8c84c8270309a27e152901418
+size 11423104

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,248 @@

+{
+  "add_bos_token": false,
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151645": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151646": {
+      "content": "<|object_ref_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151647": {
+      "content": "<|object_ref_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151648": {
+      "content": "<|box_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151649": {
+      "content": "<|box_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151650": {
+      "content": "<|quad_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151651": {
+      "content": "<|quad_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151652": {
+      "content": "<|vision_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151653": {
+      "content": "<|vision_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151654": {
+      "content": "<|vision_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151655": {
+      "content": "<|image_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151656": {
+      "content": "<|video_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151657": {
+      "content": "<tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151658": {
+      "content": "</tool_call>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151659": {
+      "content": "<|fim_prefix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151660": {
+      "content": "<|fim_middle|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151661": {
+      "content": "<|fim_suffix|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151662": {
+      "content": "<|fim_pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151663": {
+      "content": "<|repo_name|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151664": {
+      "content": "<|file_sep|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    },
+    "151665": {
+      "content": "[STEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151666": {
+      "content": "[/STEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151667": {
+      "content": "[TURN]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151668": {
+      "content": "[/TURN]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151669": {
+      "content": "[REVISION]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151670": {
+      "content": "[/REVISION]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [
+    "[STEP]",
+    "[/STEP]",
+    "[TURN]",
+    "[/TURN]",
+    "[REVISION]",
+    "[/REVISION]"
+  ],
+  "bos_token": null,
+  "chat_template": "{%- if tools %}\n    {{- '<|im_start|>system\\n' }}\n    {%- if messages[0]['role'] == 'system' %}\n        {{- messages[0]['content'] }}\n    {%- else %}\n        {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' }}\n    {%- endif %}\n    {{- \"\\n\\n# Tools\\n\\nYou may call one or more functions to assist with the user query.\\n\\nYou are provided with function signatures within <tools></tools> XML tags:\\n<tools>\" }}\n    {%- for tool in tools %}\n        {{- \"\\n\" }}\n        {{- tool | tojson }}\n    {%- endfor %}\n    {{- \"\\n</tools>\\n\\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\\n<tool_call>\\n{\\\"name\\\": <function-name>, \\\"arguments\\\": <args-json-object>}\\n</tool_call><|im_end|>\\n\" }}\n{%- else %}\n    {%- if messages[0]['role'] == 'system' %}\n        {{- '<|im_start|>system\\n' + messages[0]['content'] + '<|im_end|>\\n' }}\n    {%- else %}\n        {{- '<|im_start|>system\\nYou are Qwen, created by Alibaba Cloud. 
You are a helpful assistant.<|im_end|>\\n' }}\n    {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n    {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and not message.tool_calls) %}\n        {{- '<|im_start|>' + message.role + '\\n' + message.content + '<|im_end|>' + '\\n' }}\n    {%- elif message.role == \"assistant\" %}\n        {{- '<|im_start|>' + message.role }}\n        {%- if message.content %}\n            {{- '\\n' + message.content }}\n        {%- endif %}\n        {%- for tool_call in message.tool_calls %}\n            {%- if tool_call.function is defined %}\n                {%- set tool_call = tool_call.function %}\n            {%- endif %}\n            {{- '\\n<tool_call>\\n{\"name\": \"' }}\n            {{- tool_call.name }}\n            {{- '\", \"arguments\": ' }}\n            {{- tool_call.arguments | tojson }}\n            {{- '}\\n</tool_call>' }}\n        {%- endfor %}\n        {{- '<|im_end|>\\n' }}\n    {%- elif message.role == \"tool\" %}\n        {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != \"tool\") %}\n            {{- '<|im_start|>user' }}\n        {%- endif %}\n        {{- '\\n<tool_response>\\n' }}\n        {{- message.content }}\n        {{- '\\n</tool_response>' }}\n        {%- if loop.last or (messages[loop.index0 + 1].role != \"tool\") %}\n            {{- '<|im_end|>\\n' }}\n        {%- endif %}\n    {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n    {{- '<|im_start|>assistant\\n' }}\n{%- endif %}\n",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|im_end|>",
+  "errors": "replace",
+  "model_max_length": 131072,
+  "pad_token": "<|endoftext|>",
+  "split_special_tokens": false,
+  "tokenizer_class": "Qwen2Tokenizer",
+  "unk_token": null
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e9f4839aff554be94540be3a42c12da267eabc09f76854c83c125032ed378c31
+size 6328

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff

wandb/debug-internal.log ADDED Viewed

	@@ -0,0 +1,373 @@

+2024-11-13 17:10:07,434 INFO    StreamThr :1939 [internal.py:wandb_internal():86] W&B internal server running at pid: 1939, started at: 2024-11-13 17:10:07.433254
+2024-11-13 17:10:07,435 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status
+2024-11-13 17:10:07,436 INFO    WriterThread:1939 [datastore.py:open_for_write():87] open: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/run-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1.wandb
+2024-11-13 17:10:07,437 DEBUG   SenderThread:1939 [sender.py:send():382] send: header
+2024-11-13 17:10:07,443 DEBUG   SenderThread:1939 [sender.py:send():382] send: run
+2024-11-13 17:10:07,751 INFO    SenderThread:1939 [dir_watcher.py:__init__():211] watching files in: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files
+2024-11-13 17:10:07,751 INFO    SenderThread:1939 [sender.py:_start_run_threads():1136] run started: kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1 with start time 1731517807.43302
+2024-11-13 17:10:07,759 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: check_version
+2024-11-13 17:10:07,760 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: check_version
+2024-11-13 17:10:07,839 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: run_start
+2024-11-13 17:10:07,929 DEBUG   HandlerThread:1939 [system_info.py:__init__():27] System info init
+2024-11-13 17:10:07,929 DEBUG   HandlerThread:1939 [system_info.py:__init__():42] System info init done
+2024-11-13 17:10:07,929 INFO    HandlerThread:1939 [system_monitor.py:start():194] Starting system monitor
+2024-11-13 17:10:07,929 INFO    SystemMonitor:1939 [system_monitor.py:_start():158] Starting system asset monitoring threads
+2024-11-13 17:10:07,930 INFO    HandlerThread:1939 [system_monitor.py:probe():214] Collecting system info
+2024-11-13 17:10:07,930 INFO    SystemMonitor:1939 [interfaces.py:start():190] Started cpu monitoring
+2024-11-13 17:10:07,931 INFO    SystemMonitor:1939 [interfaces.py:start():190] Started disk monitoring
+2024-11-13 17:10:07,932 INFO    SystemMonitor:1939 [interfaces.py:start():190] Started gpu monitoring
+2024-11-13 17:10:07,933 INFO    SystemMonitor:1939 [interfaces.py:start():190] Started memory monitoring
+2024-11-13 17:10:07,933 INFO    SystemMonitor:1939 [interfaces.py:start():190] Started network monitoring
+2024-11-13 17:10:07,993 DEBUG   HandlerThread:1939 [system_info.py:probe():151] Probing system
+2024-11-13 17:10:07,996 DEBUG   HandlerThread:1939 [system_info.py:_probe_git():136] Probing git
+2024-11-13 17:10:08,005 DEBUG   HandlerThread:1939 [system_info.py:_probe_git():144] Probing git done
+2024-11-13 17:10:08,005 DEBUG   HandlerThread:1939 [system_info.py:probe():199] Probing system done
+2024-11-13 17:10:08,005 DEBUG   HandlerThread:1939 [system_monitor.py:probe():223] {'os': 'Linux-5.10.226-214.879.amzn2.x86_64-x86_64-with-glibc2.31', 'python': '3.10.12', 'heartbeatAt': '2024-11-13T17:10:07.993791', 'startedAt': '2024-11-13T17:10:07.428221', 'docker': None, 'cuda': None, 'args': ('--batch_size', '64', '--cache_dir', '/opt/ml/data/input/.cache', '--dataset', 'code-contests', '--gradient_accumulation_steps', '8', '--logging_steps', '5', '--lr', '1e-5', '--max_seq_length', '2048', '--model_name', 'Qwen/Qwen2.5-Coder-7B-Instruct', '--num_train_epochs', '2', '--output_dir', '/opt/ml/model/', '--push_to_hub', 'True', '--run_name', 'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', '--save_steps', '100', '--schedule', 'cosine', '--wandb_project', 'sft-codecontests-1112', '--weight_decay', '0.0'), 'state': 'running', 'program': '/opt/ml/code/qlearning_reasoning/training/sft.py', 'codePathLocal': 'qlearning_reasoning/training/sft.py', 'codePath': 'qlearning_reasoning/training/sft.py', 'git': {'remote': '[email protected]:TRI-ML/reasoning-value-verifiers.git', 'commit': 'cbfd05147f15c55be83f4996eebdb305c17f119d'}, 'email': None, 'root': '/opt/ml/code', 'host': 'algo-1', 'username': 'root', 'executable': '/opt/conda/bin/python3.10', 'cpu_count': 96, 'cpu_count_logical': 192, 'cpu_freq': {'current': 2807.4830677083337, 'min': 0.0, 'max': 0.0}, 'cpu_freq_per_core': [{'current': 3476.342, 'min': 0.0, 'max': 0.0}, {'current': 3247.882, 'min': 0.0, 'max': 0.0}, {'current': 2904.031, 'min': 0.0, 'max': 0.0}, {'current': 3109.433, 'min': 0.0, 'max': 0.0}, {'current': 3599.377, 'min': 0.0, 'max': 0.0}, {'current': 3103.902, 'min': 0.0, 'max': 0.0}, {'current': 3160.704, 'min': 0.0, 'max': 0.0}, {'current': 2903.061, 'min': 0.0, 'max': 0.0}, {'current': 3151.516, 'min': 0.0, 'max': 0.0}, {'current': 3220.914, 'min': 0.0, 'max': 0.0}, {'current': 3113.9, 'min': 0.0, 'max': 0.0}, {'current': 3599.288, 
'min': 0.0, 'max': 0.0}, {'current': 3149.924, 'min': 0.0, 'max': 0.0}, {'current': 3195.68, 'min': 0.0, 'max': 0.0}, {'current': 3273.352, 'min': 0.0, 'max': 0.0}, {'current': 3152.916, 'min': 0.0, 'max': 0.0}, {'current': 2940.821, 'min': 0.0, 'max': 0.0}, {'current': 2997.447, 'min': 0.0, 'max': 0.0}, {'current': 2722.682, 'min': 0.0, 'max': 0.0}, {'current': 2960.205, 'min': 0.0, 'max': 0.0}, {'current': 3014.718, 'min': 0.0, 'max': 0.0}, {'current': 2865.342, 'min': 0.0, 'max': 0.0}, {'current': 2643.892, 'min': 0.0, 'max': 0.0}, {'current': 2626.179, 'min': 0.0, 'max': 0.0}, {'current': 3181.377, 'min': 0.0, 'max': 0.0}, {'current': 3271.231, 'min': 0.0, 'max': 0.0}, {'current': 3187.187, 'min': 0.0, 'max': 0.0}, {'current': 3199.812, 'min': 0.0, 'max': 0.0}, {'current': 3207.165, 'min': 0.0, 'max': 0.0}, {'current': 3251.62, 'min': 0.0, 'max': 0.0}, {'current': 3597.089, 'min': 0.0, 'max': 0.0}, {'current': 3222.446, 'min': 0.0, 'max': 0.0}, {'current': 3597.008, 'min': 0.0, 'max': 0.0}, {'current': 3199.923, 'min': 0.0, 'max': 0.0}, {'current': 3328.709, 'min': 0.0, 'max': 0.0}, {'current': 3189.821, 'min': 0.0, 'max': 0.0}, {'current': 3176.968, 'min': 0.0, 'max': 0.0}, {'current': 3170.487, 'min': 0.0, 'max': 0.0}, {'current': 3186.086, 'min': 0.0, 'max': 0.0}, {'current': 3216.688, 'min': 0.0, 'max': 0.0}, {'current': 3594.347, 'min': 0.0, 'max': 0.0}, {'current': 3039.479, 'min': 0.0, 'max': 0.0}, {'current': 3486.888, 'min': 0.0, 'max': 0.0}, {'current': 3343.804, 'min': 0.0, 'max': 0.0}, {'current': 3238.757, 'min': 0.0, 'max': 0.0}, {'current': 2966.737, 'min': 0.0, 'max': 0.0}, {'current': 3348.466, 'min': 0.0, 'max': 0.0}, {'current': 2907.859, 'min': 0.0, 'max': 0.0}, {'current': 3002.238, 'min': 0.0, 'max': 0.0}, {'current': 2217.1, 'min': 0.0, 'max': 0.0}, {'current': 2241.607, 'min': 0.0, 'max': 0.0}, {'current': 2684.27, 'min': 0.0, 'max': 0.0}, {'current': 2719.247, 'min': 0.0, 'max': 0.0}, {'current': 2783.971, 'min': 0.0, 'max': 0.0}, 
{'current': 2773.016, 'min': 0.0, 'max': 0.0}, {'current': 3086.799, 'min': 0.0, 'max': 0.0}, {'current': 2611.966, 'min': 0.0, 'max': 0.0}, {'current': 2540.393, 'min': 0.0, 'max': 0.0}, {'current': 2541.301, 'min': 0.0, 'max': 0.0}, {'current': 2543.134, 'min': 0.0, 'max': 0.0}, {'current': 1889.373, 'min': 0.0, 'max': 0.0}, {'current': 2536.698, 'min': 0.0, 'max': 0.0}, {'current': 1960.209, 'min': 0.0, 'max': 0.0}, {'current': 1871.901, 'min': 0.0, 'max': 0.0}, {'current': 2935.658, 'min': 0.0, 'max': 0.0}, {'current': 2920.588, 'min': 0.0, 'max': 0.0}, {'current': 3597.066, 'min': 0.0, 'max': 0.0}, {'current': 3324.97, 'min': 0.0, 'max': 0.0}, {'current': 3298.432, 'min': 0.0, 'max': 0.0}, {'current': 3404.565, 'min': 0.0, 'max': 0.0}, {'current': 2925.92, 'min': 0.0, 'max': 0.0}, {'current': 3278.833, 'min': 0.0, 'max': 0.0}, {'current': 2607.119, 'min': 0.0, 'max': 0.0}, {'current': 1884.144, 'min': 0.0, 'max': 0.0}, {'current': 2516.733, 'min': 0.0, 'max': 0.0}, {'current': 1885.068, 'min': 0.0, 'max': 0.0}, {'current': 1881.651, 'min': 0.0, 'max': 0.0}, {'current': 2500.279, 'min': 0.0, 'max': 0.0}, {'current': 2519.44, 'min': 0.0, 'max': 0.0}, {'current': 2497.886, 'min': 0.0, 'max': 0.0}, {'current': 3376.996, 'min': 0.0, 'max': 0.0}, {'current': 3262.597, 'min': 0.0, 'max': 0.0}, {'current': 3258.462, 'min': 0.0, 'max': 0.0}, {'current': 3243.917, 'min': 0.0, 'max': 0.0}, {'current': 3263.253, 'min': 0.0, 'max': 0.0}, {'current': 3596.819, 'min': 0.0, 'max': 0.0}, {'current': 3251.877, 'min': 0.0, 'max': 0.0}, {'current': 3453.493, 'min': 0.0, 'max': 0.0}, {'current': 3597.538, 'min': 0.0, 'max': 0.0}, {'current': 3252.456, 'min': 0.0, 'max': 0.0}, {'current': 3235.472, 'min': 0.0, 'max': 0.0}, {'current': 3258.914, 'min': 0.0, 'max': 0.0}, {'current': 3221.932, 'min': 0.0, 'max': 0.0}, {'current': 3223.056, 'min': 0.0, 'max': 0.0}, {'current': 2916.257, 'min': 0.0, 'max': 0.0}, {'current': 3221.381, 'min': 0.0, 'max': 0.0}, {'current': 3249.041, 'min': 
0.0, 'max': 0.0}, {'current': 3158.094, 'min': 0.0, 'max': 0.0}, {'current': 3117.532, 'min': 0.0, 'max': 0.0}, {'current': 3180.319, 'min': 0.0, 'max': 0.0}, {'current': 3597.35, 'min': 0.0, 'max': 0.0}, {'current': 2902.289, 'min': 0.0, 'max': 0.0}, {'current': 3193.614, 'min': 0.0, 'max': 0.0}, {'current': 3132.908, 'min': 0.0, 'max': 0.0}, {'current': 3221.533, 'min': 0.0, 'max': 0.0}, {'current': 3082.135, 'min': 0.0, 'max': 0.0}, {'current': 3036.898, 'min': 0.0, 'max': 0.0}, {'current': 3596.595, 'min': 0.0, 'max': 0.0}, {'current': 3185.956, 'min': 0.0, 'max': 0.0}, {'current': 3178.002, 'min': 0.0, 'max': 0.0}, {'current': 3186.383, 'min': 0.0, 'max': 0.0}, {'current': 3138.284, 'min': 0.0, 'max': 0.0}, {'current': 2890.053, 'min': 0.0, 'max': 0.0}, {'current': 2878.155, 'min': 0.0, 'max': 0.0}, {'current': 2943.671, 'min': 0.0, 'max': 0.0}, {'current': 2924.089, 'min': 0.0, 'max': 0.0}, {'current': 2461.058, 'min': 0.0, 'max': 0.0}, {'current': 2961.225, 'min': 0.0, 'max': 0.0}, {'current': 3097.346, 'min': 0.0, 'max': 0.0}, {'current': 2638.607, 'min': 0.0, 'max': 0.0}, {'current': 3267.369, 'min': 0.0, 'max': 0.0}, {'current': 3301.989, 'min': 0.0, 'max': 0.0}, {'current': 3255.895, 'min': 0.0, 'max': 0.0}, {'current': 3305.783, 'min': 0.0, 'max': 0.0}, {'current': 3320.452, 'min': 0.0, 'max': 0.0}, {'current': 3278.446, 'min': 0.0, 'max': 0.0}, {'current': 3598.093, 'min': 0.0, 'max': 0.0}, {'current': 3266.814, 'min': 0.0, 'max': 0.0}, {'current': 3596.43, 'min': 0.0, 'max': 0.0}, {'current': 3270.648, 'min': 0.0, 'max': 0.0}, {'current': 3505.783, 'min': 0.0, 'max': 0.0}, {'current': 3297.048, 'min': 0.0, 'max': 0.0}, {'current': 3264.728, 'min': 0.0, 'max': 0.0}, {'current': 3224.761, 'min': 0.0, 'max': 0.0}, {'current': 3342.449, 'min': 0.0, 'max': 0.0}, {'current': 3342.148, 'min': 0.0, 'max': 0.0}, {'current': 3597.921, 'min': 0.0, 'max': 0.0}, {'current': 3251.183, 'min': 0.0, 'max': 0.0}, {'current': 3533.37, 'min': 0.0, 'max': 0.0}, 
{'current': 3446.582, 'min': 0.0, 'max': 0.0}, {'current': 3261.516, 'min': 0.0, 'max': 0.0}, {'current': 3254.535, 'min': 0.0, 'max': 0.0}, {'current': 3261.428, 'min': 0.0, 'max': 0.0}, {'current': 3262.921, 'min': 0.0, 'max': 0.0}, {'current': 3276.045, 'min': 0.0, 'max': 0.0}, {'current': 3266.835, 'min': 0.0, 'max': 0.0}, {'current': 2751.168, 'min': 0.0, 'max': 0.0}, {'current': 3167.713, 'min': 0.0, 'max': 0.0}, {'current': 3180.263, 'min': 0.0, 'max': 0.0}, {'current': 3203.948, 'min': 0.0, 'max': 0.0}, {'current': 3234.562, 'min': 0.0, 'max': 0.0}, {'current': 3486.665, 'min': 0.0, 'max': 0.0}, {'current': 2789.289, 'min': 0.0, 'max': 0.0}, {'current': 2859.707, 'min': 0.0, 'max': 0.0}, {'current': 3143.341, 'min': 0.0, 'max': 0.0}, {'current': 3089.871, 'min': 0.0, 'max': 0.0}, {'current': 2266.761, 'min': 0.0, 'max': 0.0}, {'current': 2745.206, 'min': 0.0, 'max': 0.0}, {'current': 2832.943, 'min': 0.0, 'max': 0.0}, {'current': 2820.125, 'min': 0.0, 'max': 0.0}, {'current': 3202.152, 'min': 0.0, 'max': 0.0}, {'current': 3127.913, 'min': 0.0, 'max': 0.0}, {'current': 3598.345, 'min': 0.0, 'max': 0.0}, {'current': 3220.73, 'min': 0.0, 'max': 0.0}, {'current': 3025.305, 'min': 0.0, 'max': 0.0}, {'current': 3391.839, 'min': 0.0, 'max': 0.0}, {'current': 3119.74, 'min': 0.0, 'max': 0.0}, {'current': 3231.315, 'min': 0.0, 'max': 0.0}, {'current': 2396.33, 'min': 0.0, 'max': 0.0}, {'current': 2423.797, 'min': 0.0, 'max': 0.0}, {'current': 2527.72, 'min': 0.0, 'max': 0.0}, {'current': 2467.572, 'min': 0.0, 'max': 0.0}, {'current': 2425.179, 'min': 0.0, 'max': 0.0}, {'current': 2028.21, 'min': 0.0, 'max': 0.0}, {'current': 2503.85, 'min': 0.0, 'max': 0.0}, {'current': 2452.12, 'min': 0.0, 'max': 0.0}, {'current': 3075.121, 'min': 0.0, 'max': 0.0}, {'current': 3222.332, 'min': 0.0, 'max': 0.0}, {'current': 3233.386, 'min': 0.0, 'max': 0.0}, {'current': 3200.352, 'min': 0.0, 'max': 0.0}, {'current': 3202.276, 'min': 0.0, 'max': 0.0}, {'current': 3598.346, 'min': 
0.0, 'max': 0.0}, {'current': 3254.354, 'min': 0.0, 'max': 0.0}, {'current': 3379.901, 'min': 0.0, 'max': 0.0}, {'current': 3594.797, 'min': 0.0, 'max': 0.0}, {'current': 3225.912, 'min': 0.0, 'max': 0.0}, {'current': 3223.292, 'min': 0.0, 'max': 0.0}, {'current': 3225.046, 'min': 0.0, 'max': 0.0}, {'current': 3214.566, 'min': 0.0, 'max': 0.0}, {'current': 3280.304, 'min': 0.0, 'max': 0.0}, {'current': 3169.07, 'min': 0.0, 'max': 0.0}, {'current': 3225.192, 'min': 0.0, 'max': 0.0}], 'disk': {'/': {'total': 119.94140625, 'used': 56.40110397338867}}, 'gpu': 'NVIDIA H100 80GB HBM3', 'gpu_count': 8, 'gpu_devices': [{'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}], 'memory': {'total': 1999.9661331176758}}
+2024-11-13 17:10:08,005 INFO    HandlerThread:1939 [system_monitor.py:probe():224] Finished collecting system info
+2024-11-13 17:10:08,005 INFO    HandlerThread:1939 [system_monitor.py:probe():227] Publishing system info
+2024-11-13 17:10:08,006 DEBUG   HandlerThread:1939 [system_info.py:_save_conda():208] Saving list of conda packages installed into the current environment
+2024-11-13 17:10:08,753 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/conda-environment.yaml
+2024-11-13 17:10:22,112 DEBUG   HandlerThread:1939 [system_info.py:_save_conda():220] Saving conda packages done
+2024-11-13 17:10:22,112 DEBUG   HandlerThread:1939 [system_info.py:_save_code():45] Saving code
+2024-11-13 17:10:22,117 DEBUG   HandlerThread:1939 [system_info.py:_save_code():66] Saving code done
+2024-11-13 17:10:22,117 DEBUG   HandlerThread:1939 [system_info.py:_save_patches():83] Saving git patches
+2024-11-13 17:10:22,755 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/conda-environment.yaml
+2024-11-13 17:10:22,755 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/code/qlearning_reasoning/training/sft.py
+2024-11-13 17:10:22,755 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/diff.patch
+2024-11-13 17:10:22,755 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/code/qlearning_reasoning/training
+2024-11-13 17:10:22,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/code/qlearning_reasoning
+2024-11-13 17:10:22,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/code
+2024-11-13 17:10:22,764 DEBUG   HandlerThread:1939 [system_info.py:_save_patches():125] Saving git patches done
+2024-11-13 17:10:22,766 INFO    HandlerThread:1939 [system_monitor.py:probe():229] Finished publishing system info
+2024-11-13 17:10:22,767 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:22,768 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: keepalive
+2024-11-13 17:10:22,768 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:22,768 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: keepalive
+2024-11-13 17:10:22,768 DEBUG   SenderThread:1939 [sender.py:send():382] send: files
+2024-11-13 17:10:22,769 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-metadata.json with policy now
+2024-11-13 17:10:22,769 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file code/qlearning_reasoning/training/sft.py with policy now
+2024-11-13 17:10:22,769 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file diff.patch with policy now
+2024-11-13 17:10:22,773 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: python_packages
+2024-11-13 17:10:22,773 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: python_packages
+2024-11-13 17:10:22,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:10:22,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:10:22,777 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:10:22,923 DEBUG   SenderThread:1939 [sender.py:send():382] send: telemetry
+2024-11-13 17:10:22,924 DEBUG   SenderThread:1939 [sender.py:send():382] send: config
+2024-11-13 17:10:22,924 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: telemetry
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:22,925 WARNING SenderThread:1939 [sender.py:send_metric():1354] Seen metric with glob (shouldn't happen)
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: telemetry
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: telemetry
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: config
+2024-11-13 17:10:23,079 INFO    wandb-upload_1:1939 [upload_job.py:push():131] Uploaded file /tmp/tmp6y9zx1o1wandb/yx5qp0zp-code/qlearning_reasoning/training/sft.py
+2024-11-13 17:10:23,081 INFO    wandb-upload_0:1939 [upload_job.py:push():131] Uploaded file /tmp/tmp6y9zx1o1wandb/ohhel8zq-wandb-metadata.json
+2024-11-13 17:10:23,084 INFO    wandb-upload_2:1939 [upload_job.py:push():131] Uploaded file /tmp/tmp6y9zx1o1wandb/o4jbd2x2-diff.patch
+2024-11-13 17:10:23,755 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/diff.patch
+2024-11-13 17:10:23,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/requirements.txt
+2024-11-13 17:10:23,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:10:23,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-metadata.json
+2024-11-13 17:10:25,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:10:27,927 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:32,928 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:37,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:10:37,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:10:37,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:10:38,878 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:39,761 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/config.yaml
+2024-11-13 17:10:44,055 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:46,939 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:10:46,941 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:46,942 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:46,942 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:46,942 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:46,942 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:10:46,942 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:10:46,944 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:10:47,764 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:10:47,765 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:10:49,765 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:10:49,946 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:52,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:10:52,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:10:52,776 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:10:55,857 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:00,858 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:05,858 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:07,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:11:07,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:11:07,815 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:11:07,934 DEBUG   SystemMonitor:1939 [system_monitor.py:_start():172] Starting system metrics aggregation loop
+2024-11-13 17:11:07,937 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:11:11,483 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:11,774 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:11:11,774 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/config.yaml
+2024-11-13 17:11:16,645 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:21,646 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:22,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:11:22,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:11:22,777 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:11:26,930 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:31,930 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:35,784 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:11:37,312 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:37,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:11:37,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:11:37,777 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:11:37,941 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:11:42,943 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:47,944 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:52,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:11:52,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:11:52,815 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:11:53,939 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:57,792 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:11:59,512 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:04,513 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:07,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:12:07,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:12:07,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:12:07,944 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:12:09,946 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:14,946 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:18,339 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:12:18,341 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:12:18,341 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:12:18,341 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:12:18,801 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:12:19,801 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:12:19,952 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:12:19,954 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:12:19,955 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:12:19,955 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:19,955 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:12:19,956 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:12:19,957 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:12:19,957 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:12:19,957 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:12:20,802 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:12:21,802 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:12:22,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:12:22,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:12:22,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:12:25,846 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:30,847 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:35,847 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:37,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:12:37,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:12:37,815 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:12:37,946 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:12:40,948 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:43,811 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:12:46,900 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:47,812 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/config.yaml
+2024-11-13 17:12:52,087 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:52,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:12:52,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:12:52,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:12:57,926 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:02,927 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:07,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:13:07,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:13:07,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:13:07,820 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:13:07,949 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:13:07,950 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:12,951 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:17,952 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:22,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:13:22,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:13:22,815 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:13:23,932 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:29,529 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:29,829 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:13:34,530 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:37,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:13:37,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:13:37,776 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:13:37,952 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:13:39,954 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:44,955 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:49,955 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:51,838 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:13:52,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:13:52,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:13:52,777 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:13:55,936 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:00,937 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:05,938 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:07,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:14:07,776 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:14:07,819 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:14:07,954 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:14:10,956 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:12,899 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:14:12,900 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:14:12,901 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:14:12,902 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:14:13,847 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:14:13,847 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:14:14,513 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:14:14,514 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:14:14,514 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:14:14,516 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:14:14,847 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:14:15,848 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:14:16,517 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:21,517 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:22,776 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:14:22,777 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:14:22,777 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:14:26,902 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:31,903 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:37,269 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:37,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:14:37,776 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:14:37,778 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:14:37,857 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:14:37,957 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:14:42,959 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:47,960 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:52,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:14:52,776 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:14:52,819 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:14:53,918 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:58,973 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:59,866 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:15:03,974 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:07,776 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:15:07,776 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:15:07,778 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:15:07,960 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:15:09,962 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:14,963 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:19,963 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:24,560 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:15:24,560 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:15:24,760 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:15:25,654 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:30,654 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:35,655 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:37,965 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:15:38,559 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:15:38,559 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:15:38,599 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:15:40,718 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:45,718 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:50,719 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:53,891 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:15:55,441 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:15:55,632 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:15:55,633 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:15:55,738 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:01,306 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:06,307 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:07,966 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:16:08,649 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:16:08,805 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:16:08,805 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:16:09,899 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:11,308 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:11,900 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:13,900 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:15,902 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:16,682 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:17,903 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:19,904 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:21,862 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:21,905 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:23,906 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:26,484 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:16:27,824 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:28,965 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:16:28,965 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:16:33,084 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:37,969 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:16:38,971 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:41,636 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:16:42,736 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:16:42,737 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:16:44,879 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:49,879 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:54,880 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:56,904 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:16:56,908 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:16:56,908 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:16:57,922 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:17:00,014 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:05,015 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:07,971 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:17:08,907 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:17:10,425 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:10,425 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:17:10,425 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:17:15,586 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:20,587 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:23,906 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:17:25,425 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:17:25,425 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:17:26,585 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:29,937 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:17:32,376 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:37,377 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:37,975 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:17:38,907 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:17:40,426 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:17:40,426 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:17:42,574 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:47,575 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:51,945 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:17:52,901 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:53,908 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:17:55,425 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:17:55,426 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:17:58,561 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:03,562 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:07,977 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:18:08,908 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:18:08,979 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:10,424 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:18:10,425 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:18:11,623 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:18:11,625 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:18:11,625 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:18:11,626 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:18:11,953 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:18:12,953 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:18:13,237 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:18:13,239 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:18:13,240 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:18:13,241 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:18:13,954 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:18:13,954 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:18:14,242 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:14,954 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:18:19,242 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:23,907 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:18:24,243 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:25,427 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:18:25,427 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:18:29,574 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:34,575 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:37,980 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:18:38,907 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:18:38,963 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:18:39,981 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:40,426 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:18:40,426 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:18:45,524 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:50,525 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:53,908 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:18:55,426 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:18:55,426 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:18:55,571 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:19:00,972 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:19:01,259 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:19:06,259 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:19:07,982 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:19:08,908 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:19:10,426 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:19:10,427 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:19:11,531 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report

wandb/debug.log ADDED Viewed

	@@ -0,0 +1,30 @@

+2024-11-13 17:10:07,429 INFO    MainThread:173 [wandb_setup.py:_flush():76] Current SDK version is 0.16.3
+2024-11-13 17:10:07,429 INFO    MainThread:173 [wandb_setup.py:_flush():76] Configure stats pid to 173
+2024-11-13 17:10:07,429 INFO    MainThread:173 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_setup.py:_flush():76] Loading settings from /opt/ml/code/wandb/settings
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_setup.py:_flush():76] Loading settings from environment variables: {'root_dir': '/opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', 'api_key': '***REDACTED***', 'project': 'sft-codecontests-1112', 'run_name': 'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048'}
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program_relpath': 'qlearning_reasoning/training/sft.py', 'program_abspath': '/opt/ml/code/qlearning_reasoning/training/sft.py', 'program': '/opt/ml/code/qlearning_reasoning/training/sft.py'}
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:_log_setup():526] Logging user logs to /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/logs/debug.log
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:_log_setup():527] Logging internal logs to /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/logs/debug-internal.log
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:init():566] calling init triggers
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:init():573] wandb.init called with sweep_config: {}
+config: {'sagemaker_training_job_name': 'kushalarora-rvv-main-2024-11-13-16-43-09-915', 'batch_size': 64, 'cache_dir': '/opt/ml/data/input/.cache', 'dataset': 'code-contests', 'gradient_accumulation_steps': 8, 'logging_steps': 5, 'lr': '1e-5', 'max_seq_length': 2048, 'model_name': 'Qwen/Qwen2.5-Coder-7B-Instruct', 'num_train_epochs': 2, 'output_dir': '/opt/ml/output', 'push_to_hub': 'true', 'run_name': 'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', 'sagemaker_container_log_level': 20, 'sagemaker_instance_type': 'ml.p5.48xlarge', 'sagemaker_job_name': 'kushalarora-rvv-main-2024-11-13-16-43-09-915', 'sagemaker_program': 'sft.py', 'sagemaker_region': 'us-east-1', 'sagemaker_submit_directory': 's3://tri-ml-datasets/kushalarora-rvv-main-2024-11-13-16-43-09-915/source/sourcedir.tar.gz', 'sagemaker_torch_distributed_enabled': 'true', 'save_steps': 100, 'schedule': 'cosine', 'wandb_project': 'sft-codecontests-1112', 'weight_decay': 0.0, 'additional_framework_parameters': {'sagemaker_instance_type': 'ml.p5.48xlarge', 'sagemaker_torch_distributed_enabled': True}, 'channel_input_dirs': {}, 'current_host': 'algo-1', 'current_instance_group': 'homogeneousCluster', 'current_instance_group_hosts': ['algo-1'], 'current_instance_type': 'ml.p5.48xlarge', 'distribution_hosts': ['algo-1'], 'distribution_instance_groups': ['homogeneousCluster'], 'framework_module': 'sagemaker_pytorch_container.training:main', 'hosts': ['algo-1'], 'hyperparameters': {'batch_size': 64, 'cache_dir': '/opt/ml/data/input/.cache', 'dataset': 'code-contests', 'gradient_accumulation_steps': 8, 'logging_steps': 5, 'lr': '1e-5', 'max_seq_length': 2048, 'model_name': 'Qwen/Qwen2.5-Coder-7B-Instruct', 'num_train_epochs': 2, 'output_dir': '/opt/ml/model/', 'push_to_hub': True, 'run_name': 'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', 'save_steps': 100, 'schedule': 'cosine', 
'wandb_project': 'sft-codecontests-1112', 'weight_decay': 0.0}, 'input_config_dir': '/opt/ml/input/config', 'input_data_config': {}, 'input_dir': '/opt/ml/input', 'instance_groups': ['homogeneousCluster'], 'instance_groups_dict': {'homogeneousCluster': {'hosts': ['algo-1'], 'instance_group_name': 'homogeneousCluster', 'instance_type': 'ml.p5.48xlarge'}}, 'is_hetero': False, 'is_master': True, 'is_modelparallel_enabled': None, 'is_smddpmprun_installed': False, 'is_smddprun_installed': True, 'job_name': 'kushalarora-rvv-main-2024-11-13-16-43-09-915', 'log_level': 20, 'master_hostname': 'algo-1', 'model_dir': '/opt/ml/model', 'module_dir': 's3://tri-ml-datasets/kushalarora-rvv-main-2024-11-13-16-43-09-915/source/sourcedir.tar.gz', 'module_name': '/opt/ml/code/qlearning_reasoning/training/sft', 'network_interface_name': 'eth0', 'num_cpus': 192, 'num_gpus': 8, 'num_neurons': 0, 'output_data_dir': '/opt/ml/output/data', 'output_intermediate_dir': '/opt/ml/output/intermediate', 'resource_config': {'current_group_name': 'homogeneousCluster', 'current_host': 'algo-1', 'current_instance_type': 'ml.p5.48xlarge', 'hosts': ['algo-1'], 'instance_groups': [{'hosts': ['algo-1'], 'instance_group_name': 'homogeneousCluster', 'instance_type': 'ml.p5.48xlarge'}], 'network_interface_name': 'eth0'}, 'user_entry_point': '/opt/ml/code/qlearning_reasoning/training/sft.py'}
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:init():616] starting backend
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:init():620] setting up manager
+2024-11-13 17:10:07,431 INFO    MainThread:173 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
+2024-11-13 17:10:07,432 INFO    MainThread:173 [wandb_init.py:init():628] backend started and connected
+2024-11-13 17:10:07,435 INFO    MainThread:173 [wandb_init.py:init():720] updated telemetry
+2024-11-13 17:10:07,442 INFO    MainThread:173 [wandb_init.py:init():753] communicating run to backend with 90.0 second timeout
+2024-11-13 17:10:07,759 INFO    MainThread:173 [wandb_run.py:_on_init():2262] communicating current version
+2024-11-13 17:10:07,794 INFO    MainThread:173 [wandb_run.py:_on_init():2271] got version response upgrade_message: "wandb version 0.18.6 is available!  To upgrade, please run:\n $ pip install wandb --upgrade"
+2024-11-13 17:10:07,794 INFO    MainThread:173 [wandb_init.py:init():804] starting run threads in backend
+2024-11-13 17:10:22,774 INFO    MainThread:173 [wandb_run.py:_console_start():2241] atexit reg
+2024-11-13 17:10:22,775 INFO    MainThread:173 [wandb_run.py:_redirect():2096] redirect: wrap_raw
+2024-11-13 17:10:22,775 INFO    MainThread:173 [wandb_run.py:_redirect():2161] Wrapping output streams.
+2024-11-13 17:10:22,775 INFO    MainThread:173 [wandb_run.py:_redirect():2186] Redirects installed.
+2024-11-13 17:10:22,776 INFO    MainThread:173 [wandb_init.py:init():847] run started, returning control to user process
+2024-11-13 17:10:22,778 INFO    MainThread:173 [wandb_run.py:_config_callback():1343] config_cb None None {'vocab_size': 151671, 'max_position_embeddings': 32768, 'hidden_size': 3584, 'intermediate_size': 18944, 'num_hidden_layers': 28, 'num_attention_heads': 28, 'use_sliding_window': False, 'sliding_window': None, 'max_window_layers': 28, 'num_key_value_heads': 4, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000.0, 'rope_scaling': None, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'bfloat16', 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': False, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['Qwen2ForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'Qwen/Qwen2.5-Coder-7B-Instruct', 
'_attn_implementation_autoset': True, 'transformers_version': '4.46.0', 'model_type': 'qwen2', 'output_dir': '/opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 8, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 1e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 2, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/runs/Nov13_17-09-37_algo-1', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'epoch', 'save_steps': 100, 'save_total_limit': None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': 5, 'dataloader_num_workers': 0, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': 
'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': ['full_shard', 'auto_wrap'], 'fsdp_min_num_params': 0, 'fsdp_config': {'activation_checkpointing': False, 'auto_wrap_policy': 'TRANSFORMER_BASED_WRAP', 'backward_prefetch': 'BACKWARD_PRE', 'cpu_ram_efficient_loading': True, 'forward_prefetch': False, 'offload_params': False, 'sharding_strategy': 'FULL_SHARD', 'state_dict_type': 'FULL_STATE_DICT', 'sync_module_states': True, 'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': None, 'hub_model_id': 'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': {'use_reentrant': False}, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'evaluation_strategy': None, 'push_to_hub_model_id': None, 
'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'eval_use_gather_object': False, 'dataset_text_field': 'text', 'packing': False, 'max_seq_length': 2048, 'dataset_num_proc': None, 'dataset_batch_size': 64, 'model_init_kwargs': None, 'dataset_kwargs': {}, 'eval_packing': None, 'num_of_sequences': 1024, 'chars_per_token': '<CHARS_PER_TOKEN>', 'use_liger': False}
+2024-11-13 17:10:22,783 INFO    MainThread:173 [wandb_config.py:__setitem__():151] config set model/num_parameters = 951599936 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f533489f280>>
+2024-11-13 17:10:22,783 INFO    MainThread:173 [wandb_run.py:_config_callback():1343] config_cb model/num_parameters 951599936 None

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/code/qlearning_reasoning/training/sft.py ADDED Viewed

	@@ -0,0 +1,249 @@

+from datasets import load_dataset, concatenate_datasets
+from transformers import AutoTokenizer, AutoModelForCausalLM, TrainingArguments
+import torch
+from transformers import get_constant_schedule_with_warmup, get_cosine_schedule_with_warmup, get_linear_schedule_with_warmup, get_inverse_sqrt_schedule
+from trl import SFTTrainer, SFTConfig, DataCollatorForCompletionOnlyLM
+import os
+from textwrap import dedent
+from absl import app, flags
+FLAGS = flags.FLAGS
+import warnings
+warnings.filterwarnings("ignore")
+from trl import setup_chat_format
+ALL_DATASET_NAMES = [
+    'prm800k',
+    'prm800k-improvement',
+    'math',
+    'math-v2',
+    'math-prm800k',
+    'math-revision',
+    'og-math',
+    'leetcode',
+    'taco',
+    'math-revision-onesamp',
+    'math-revision-onesamp-overlap',
+    'math-revision-onesamp-correct-overlap',
+    'math-revision-onesamp-correct-overlap',
+    'code-contests'
+]
+flags.DEFINE_enum('dataset', 'prm800k', ALL_DATASET_NAMES, 'Name of the dataset')  # selects dataset_name and the instruction/response templates in main()
+flags.DEFINE_string('cache_dir', '/scratch/bclj/asingh15/.cache', 'Directory to store cache files')  # passed as cache_dir to AutoTokenizer.from_pretrained and exported as HF_DATASETS_CACHE
+flags.DEFINE_string('output_dir', '/scratch/bclj/asingh15/sft_checkpoints/', 'Directory to store output files')  # created by main() when missing; WANDB_DIR is set to <output_dir>/<run_name>
+flags.DEFINE_string('run_name', 'sft', 'Name of the run')  # also exported as WANDB_NAME
+flags.DEFINE_string('model_name', 'deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct', 'Name of the model')  # tokenizer is loaded from this id with trust_remote_code=True
+flags.DEFINE_string('token', None, 'Hugging Face API token')
+flags.DEFINE_string('wandb_project', 'sft-prm800k-pregen-0501', 'Wandb project name')  # exported as WANDB_PROJECT
+flags.DEFINE_string('optim', 'adamw_torch', 'Optimizer')
+flags.DEFINE_string('schedule', 'constant', 'Learning rate schedule')
+flags.DEFINE_float('lr', 5e-5, 'Learning rate')
+flags.DEFINE_float('weight_decay', 0.0, 'Weight decay')
+flags.DEFINE_integer('warmup_steps', 0, 'Number of warmup steps')
+flags.DEFINE_integer('num_train_epochs', 1, 'Number of training epochs')
+flags.DEFINE_integer('batch_size', 256, 'Batch size')  # NOTE(review): global vs per-device meaning is not visible in this part of the file - confirm
+flags.DEFINE_integer('gradient_accumulation_steps', 64, 'Gradient accumulation steps')
+flags.DEFINE_integer('max_seq_length', 1024, 'Maximum sequence length')
+flags.DEFINE_integer('logging_steps', 100, 'Logging steps')
+flags.DEFINE_integer('save_steps', 1000, 'Save steps')
+flags.DEFINE_integer('seed', 42, 'Random seed')
+flags.DEFINE_string('fsdp', "full_shard auto_wrap", 'If to use FSDP')
+flags.DEFINE_string('fsdp_config', "qlearning_reasoning/accelerate_configs/fsdp_config.json", 'FSDP config to use.')
+flags.DEFINE_boolean("push_to_hub", False, "Should the model be uploaded to Huggingface hub?")
+flags.DEFINE_boolean('add_step_tokens', True, 'Add step tokens')  # when set, main() adds the [STEP]/[TURN]/[REVISION] marker tokens to the tokenizer
+flags.DEFINE_string("hub_model_id", None, "Hub model id. If not defined it will be truncated run name.")  # main() falls back to FLAGS.run_name[:96] when this is None
+START_OF_STEP_TOKEN = '[STEP]'  # the six markers below are added as additional special tokens when --add_step_tokens is set
+END_OF_STEP_TOKEN = '[/STEP]'
+START_OF_TURN_TOKEN = '[TURN]'  # the turn markers also build the response template for the 'math-revision' datasets
+END_OF_TURN_TOKEN = '[/TURN]'
+START_OF_REVISION_TOKEN = '[REVISION]'
+END_OF_REVISION_TOKEN = '[/REVISION]'
+def main(_):
+    if FLAGS.hub_model_id is None:
+        FLAGS.hub_model_id = FLAGS.run_name[:96]
+    if not os.path.exists(FLAGS.output_dir):
+        os.makedirs(FLAGS.output_dir, exist_ok=True)
+        os.makedirs(f"{FLAGS.output_dir}/{FLAGS.run_name}", exist_ok=True)
+    os.environ["WANDB_PROJECT"] = FLAGS.wandb_project
+    os.environ["WANDB_DIR"] = f"{FLAGS.output_dir}/{FLAGS.run_name}"
+    os.environ["WANDB_NAME"] = FLAGS.run_name
+    os.environ["HF_DATASETS_CACHE"] = FLAGS.cache_dir
+    shared_kwargs = dict(
+        cache_dir=FLAGS.cache_dir,
+        trust_remote_code=True,
+    )
+    tokenizer = AutoTokenizer.from_pretrained(
+        FLAGS.model_name,
+        **shared_kwargs,
+    )
+    if tokenizer.pad_token is None:
+        tokenizer.pad_token = tokenizer.eos_token
+    if FLAGS.add_step_tokens:
+        tokenizer.add_special_tokens(
+            {'additional_special_tokens': [START_OF_STEP_TOKEN, END_OF_STEP_TOKEN, START_OF_TURN_TOKEN, END_OF_TURN_TOKEN, START_OF_REVISION_TOKEN, END_OF_REVISION_TOKEN]}
+        )
+        print(f"Tokenizer vocab size: {len(tokenizer)}")
+        print('EOS token:', tokenizer.eos_token)
+        print('PAD token:', tokenizer.pad_token)
+        print('Special tokens:', tokenizer.special_tokens_map)
+    instruction_template = "# Question\n\n"
+    if FLAGS.dataset == 'prm800k':
+        dataset_name = 'Asap7772/sft_prm800k_processed'
+        response_template = "# Solution\n\n"
+    elif FLAGS.dataset == 'math':
+        dataset_name = 'Asap7772/sft_math_processed'
+        response_template = "# Solution\n\n"
+    elif FLAGS.dataset == 'math-prm800k':
+        dataset_name = ['Asap7772/sft_prm800k_processed', 'Asap7772/sft_math_processed']
+        response_template = "# Solution\n\n"
+    elif FLAGS.dataset == 'og-math':
+        dataset_name = 'Asap7772/hendrycks_math_sft_formatted'
+        response_template = "# Solution\n\n"
+    elif FLAGS.dataset == 'leetcode':
+        dataset_name = 'Asap7772/leetcode-rosetta-processed'
+        instruction_template = "# Question"
+        response_template = "# Solution"
+    elif FLAGS.dataset == 'prm800k-improvement':
+        dataset_name = 'Asap7772/prm800k_improvement_groundtruth_values'
+        instruction_template = 'Solution Steps:'
+        response_template = "Improved Step:"
+    elif FLAGS.dataset == 'taco':
+        dataset_name = 'Asap7772/TACO-Processed'
+        instruction_template = "# Question"
+        response_template = "# Solution"
+    elif FLAGS.dataset == 'math-revision':
+        dataset_name = 'Asap7772/hendrycks-math-mc-llama-sftnoic-revisions-filtered'
+        instruction_template = "# Question"
+        response_template = f"{END_OF_TURN_TOKEN}\n\n{START_OF_TURN_TOKEN}"
+    elif FLAGS.dataset == 'math-revision-ic':
+        dataset_name = 'Asap7772/hendrycks-math-mc-llama-revisions-filtered'
+        instruction_template = "# Question"
+        response_template = f"{END_OF_TURN_TOKEN}\n\n{START_OF_TURN_TOKEN}"
+    elif FLAGS.dataset == 'math-revision-onesamp':
+        dataset_name = 'Asap7772/hendrycks-math-onesamp-revision'
+        instruction_template = "# Question"
+        response_template = "# Solution"
+    elif FLAGS.dataset == 'math-revision-onesamp-overlap':
+        dataset_name = 'Asap7772/hendrycks-math-onesamp-revision-overlap'
+        instruction_template = "# Question"
+        response_template = "# Solution"
+    elif FLAGS.dataset == 'math-v2':
+        dataset_name = 'Asap7772/sft_math_405b'
+        instruction_template = "# Question"
+        response_template = "# Solution"
+    elif FLAGS.dataset == 'math-revision-onesamp-correct-overlap':
+        dataset_name = 'Asap7772/hendrycks-math-onesamp-revision-correct-overlap'
+        instruction_template = "# Question"
+        response_template = "# Solution"
+    elif FLAGS.dataset == 'code-contests':
+        dataset_name = 'Asap7772/code_contests'
+        instruction_template = "Q:"
+        response_template = "A:"
+    else:
+        raise ValueError(f"Invalid dataset: {FLAGS.dataset}")
+    if isinstance(dataset_name, list):
+        all_datasets = [load_dataset(name, cache_dir=FLAGS.cache_dir) for name in dataset_name]
+        train_dataset = concatenate_datasets([dataset['train'] for dataset in all_datasets])
+        eval_dataset = concatenate_datasets([dataset['test'] for dataset in all_datasets])
+        print(f"example: {train_dataset[0]}")
+    elif isinstance(dataset_name, str):
+        dataset_dict = load_dataset(dataset_name, cache_dir=FLAGS.cache_dir)
+        train_dataset, eval_dataset = dataset_dict['train'], dataset_dict['test']
+    else:
+        raise ValueError(f"Invalid dataset name: {dataset_name}")
+    train_dataset, eval_dataset = train_dataset.shuffle(seed=FLAGS.seed), eval_dataset.shuffle(seed=FLAGS.seed)
+    num_train_epochs = FLAGS.num_train_epochs
+    def formatting_prompts_func(example):
+        output_texts = []
+        for i in range(len(example['text'])):
+            if FLAGS.dataset in ALL_DATASET_NAMES:
+                text = f"{example['text'][i]}{tokenizer.eos_token}"
+            else:
+                raise ValueError(f"Invalid dataset: {FLAGS.dataset}")
+            text = dedent(text).strip()
+            output_texts.append(text)
+        return output_texts
+    format_example = formatting_prompts_func(train_dataset[0:1])
+    print(f"Example formatted prompt: \n\n{format_example[0]}\n\n")
+    assert instruction_template in format_example[0], f"Instruction template not found in text."
+    assert response_template in format_example[0], f"Response template not found in text."
+    assert tokenizer.eos_token in format_example[0], f"EOS token not found in text."
+    instruction_template_ids = tokenizer.encode(instruction_template, add_special_tokens=False)[:2]
+    response_template_ids = tokenizer.encode(response_template, add_special_tokens=False)[:2]
+    collator = DataCollatorForCompletionOnlyLM(instruction_template=instruction_template_ids, response_template=response_template_ids, tokenizer=tokenizer, mlm=False)
+    model = AutoModelForCausalLM.from_pretrained(
+        FLAGS.model_name,
+        low_cpu_mem_usage=True,
+        torch_dtype=torch.bfloat16,
+        **shared_kwargs,
+    )
+    model.resize_token_embeddings(len(tokenizer))
+    if getattr(model, "config", None) is not None:
+        model.config.pad_token_id = tokenizer.pad_token_id
+        model.config.bos_token_id = tokenizer.bos_token_id
+        model.config.eos_token_id = tokenizer.eos_token_id
+    # Update the generation config to use the new eos & bos token
+    if getattr(model, "generation_config", None) is not None:
+        model.generation_config.bos_token_id = tokenizer.bos_token_id
+        model.generation_config.eos_token_id = tokenizer.eos_token_id
+        model.generation_config.pad_token_id = tokenizer.pad_token_id
+    model.config.use_cache = False
+    model.gradient_checkpointing_enable()
+    transformer_args = SFTConfig(
+        run_name=FLAGS.run_name,
+        output_dir=f"{FLAGS.output_dir}/{FLAGS.run_name}",
+        learning_rate=FLAGS.lr,
+        eval_strategy="steps",
+        logging_strategy="steps",
+        logging_first_step=True,
+        save_strategy="epoch",
+        dataset_batch_size=FLAGS.batch_size,
+        max_seq_length=FLAGS.max_seq_length,
+        gradient_accumulation_steps=FLAGS.gradient_accumulation_steps,
+        gradient_checkpointing_kwargs={'use_reentrant':False},
+        logging_steps=FLAGS.logging_steps,
+        save_steps=FLAGS.save_steps,
+        lr_scheduler_type=FLAGS.schedule,
+        optim=FLAGS.optim,
+        weight_decay=FLAGS.weight_decay,
+        warmup_steps=FLAGS.warmup_steps,
+        fsdp=FLAGS.fsdp,
+        fsdp_config=FLAGS.fsdp_config if FLAGS.fsdp != '' else None,
+        push_to_hub=FLAGS.push_to_hub,
+        num_train_epochs=num_train_epochs,
+        hub_model_id=FLAGS.hub_model_id
+    )
+    flags_dict = FLAGS.flag_values_dict()
+    trainer = SFTTrainer(
+        model=model,
+        args=transformer_args,
+        tokenizer=tokenizer,
+        train_dataset=train_dataset,
+        eval_dataset=eval_dataset,
+        formatting_func=formatting_prompts_func,
+        data_collator=collator,
+        dataset_batch_size=FLAGS.batch_size,
+    )
+    trainer.train()
+# Script entry point: hand main() to app.run when the file is executed directly
+# (presumably absl's app.run, which parses the flags first -- confirm against the imports).
+if __name__ == '__main__':
+    app.run(main)

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/conda-environment.yaml ADDED Viewed

	@@ -0,0 +1,515 @@

+name: base
+channels:
+  - fastai
+  - nvidia
+  - https://aws-ml-conda.s3.us-west-2.amazonaws.com
+  - conda-forge
+dependencies:
+  - _libgcc_mutex=0.1=conda_forge
+  - _openmp_mutex=4.5=2_kmp_llvm
+  - alsa-lib=1.2.12=h4ab18f5_0
+  - annotated-types=0.7.0=pyhd8ed1ab_0
+  - asttokens=2.4.1=pyhd8ed1ab_0
+  - attr=2.5.1=h166bdaf_1
+  - aws-ofi-nccl=1.9.1=aws_efa1.26.1_0
+  - blas=1.0=mkl
+  - boltons=23.0.0=pyhd8ed1ab_0
+  - brotli-bin=1.1.0=hd590300_0
+  - bzip2=1.0.8=h7f98852_4
+  - c-ares=1.32.3=h4bc722e_0
+  - ca-certificates=2024.7.4=hbcca054_0
+  - cached-property=1.5.2=hd8ed1ab_1
+  - cached_property=1.5.2=pyha770c72_1
+  - cairo=1.18.0=h3faef2a_0
+  - catalogue=2.0.10=py310hff52083_0
+  - certifi=2024.7.4=pyhd8ed1ab_0
+  - cffi=1.15.1=py310h255011f_3
+  - charset-normalizer=3.2.0=pyhd8ed1ab_0
+  - click=8.1.7=unix_pyh707e725_0
+  - cloudpathlib=0.18.1=pyhd8ed1ab_0
+  - colorama=0.4.6=pyhd8ed1ab_0
+  - comm=0.2.2=pyhd8ed1ab_0
+  - conda=23.3.1=py310hff52083_0
+  - conda-libmamba-solver=23.3.0=pyhd8ed1ab_0
+  - conda-package-handling=2.2.0=pyh38be061_0
+  - conda-package-streaming=0.9.0=pyhd8ed1ab_0
+  - confection=0.1.4=py310h17c5347_0
+  - contourpy=1.2.1=py310hd41b1e2_0
+  - cuda-cccl=12.4.127=0
+  - cuda-compiler=12.1.1=0
+  - cuda-cudart=12.1.105=0
+  - cuda-cudart-dev=12.1.105=0
+  - cuda-cudart-static=12.1.105=0
+  - cuda-cuobjdump=12.4.127=0
+  - cuda-cupti=12.1.105=0
+  - cuda-cupti-static=12.1.105=0
+  - cuda-cuxxfilt=12.4.127=0
+  - cuda-driver-dev=12.4.127=0
+  - cuda-libraries=12.1.0=0
+  - cuda-libraries-dev=12.1.0=0
+  - cuda-libraries-static=12.1.1=0
+  - cuda-nvcc=12.1.105=0
+  - cuda-nvprune=12.4.127=0
+  - cuda-nvrtc=12.1.105=0
+  - cuda-nvrtc-dev=12.1.105=0
+  - cuda-nvrtc-static=12.1.105=0
+  - cuda-nvtx=12.1.105=0
+  - cuda-opencl=12.4.127=0
+  - cuda-opencl-dev=12.4.127=0
+  - cuda-profiler-api=12.4.127=0
+  - cuda-runtime=12.1.0=0
+  - cuda-version=12.1=h1d6eff3_3
+  - curl=8.8.0=he654da7_1
+  - cycler=0.12.1=pyhd8ed1ab_0
+  - cymem=2.0.8=py310hc6cd4ac_1
+  - cython=3.0.11=py310hea249c9_0
+  - cython-blis=0.7.10=py310h1f7b6fc_2
+  - dbus=1.13.6=h5008d03_3
+  - debugpy=1.8.5=py310hea249c9_0
+  - decorator=5.1.1=pyhd8ed1ab_0
+  - docutils=0.16=py310hff52083_4
+  - exceptiongroup=1.2.2=pyhd8ed1ab_0
+  - executing=2.0.1=pyhd8ed1ab_0
+  - expat=2.6.2=h59595ed_0
+  - fastai=2.7.16=py_0
+  - fastcore=1.5.55=py_0
+  - fastdownload=0.0.7=py_0
+  - fastprogress=1.0.3=py_0
+  - ffmpeg=4.2=h3fd9d12_1
+  - filelock=3.15.4=pyhd8ed1ab_0
+  - fmt=9.1.0=h924138e_0
+  - font-ttf-dejavu-sans-mono=2.37=hab24e00_0
+  - font-ttf-inconsolata=3.000=h77eed37_0
+  - font-ttf-source-code-pro=2.038=h77eed37_0
+  - font-ttf-ubuntu=0.83=h77eed37_2
+  - fontconfig=2.14.2=h14ed4e7_0
+  - fonts-conda-ecosystem=1=0
+  - fonts-conda-forge=1=0
+  - fonttools=4.53.1=py310h5b4e0ec_0
+  - freetype=2.12.1=h267a509_2
+  - gettext=0.22.5=h59595ed_2
+  - gettext-tools=0.22.5=h59595ed_2
+  - glib=2.80.2=hf974151_0
+  - glib-tools=2.80.2=hb6ce0ca_0
+  - gmp=6.3.0=hac33072_2
+  - gmpy2=2.1.5=py310hc7909c9_1
+  - gnutls=3.6.15=he1e5248_0
+  - graphite2=1.3.13=h59595ed_1003
+  - gst-plugins-base=1.22.9=hfa15dee_1
+  - gstreamer=1.22.9=h98fc4e7_1
+  - h5py=3.11.0=nompi_py310hf054cd7_102
+  - harfbuzz=8.5.0=hfac3d4d_0
+  - hdf5=1.14.3=nompi_hdf9ad27_105
+  - hwloc=2.9.2=h2bc3f7f_0
+  - icu=73.2=h59595ed_0
+  - idna=3.7=pyhd8ed1ab_0
+  - importlib_metadata=8.2.0=hd8ed1ab_0
+  - jedi=0.19.1=pyhd8ed1ab_0
+  - jinja2=3.1.4=pyhd8ed1ab_0
+  - jmespath=1.0.1=pyhd8ed1ab_0
+  - joblib=1.4.2=pyhd8ed1ab_0
+  - jsonpatch=1.32=pyhd8ed1ab_0
+  - jsonpointer=2.0=py_0
+  - jupyter_client=8.6.2=pyhd8ed1ab_0
+  - jupyter_core=5.7.2=py310hff52083_0
+  - keyutils=1.6.1=h166bdaf_0
+  - kiwisolver=1.4.5=py310hd41b1e2_1
+  - krb5=1.21.3=h659f571_0
+  - lame=3.100=h166bdaf_1003
+  - langcodes=3.4.0=pyhd8ed1ab_0
+  - language-data=1.2.0=pyhd8ed1ab_0
+  - lcms2=2.16=hb7c19ff_0
+  - ld_impl_linux-64=2.40=h41732ed_0
+  - lerc=4.0.0=h27087fc_0
+  - libaec=1.1.3=h59595ed_0
+  - libarchive=3.6.2=h039dbb9_1
+  - libasprintf=0.22.5=h661eb56_2
+  - libasprintf-devel=0.22.5=h661eb56_2
+  - libblas=3.9.0=21_linux64_mkl
+  - libbrotlicommon=1.1.0=hd590300_0
+  - libbrotlidec=1.1.0=hd590300_0
+  - libbrotlienc=1.1.0=hd590300_0
+  - libcap=2.69=h0f662aa_0
+  - libcblas=3.9.0=21_linux64_mkl
+  - libclang=15.0.7=default_h127d8a8_5
+  - libclang13=15.0.7=default_h5d6823c_5
+  - libcublas=12.1.0.26=0
+  - libcublas-dev=12.1.0.26=0
+  - libcublas-static=12.1.3.1=hd3aeb46_0
+  - libcufft=11.0.2.4=0
+  - libcufft-dev=11.0.2.4=0
+  - libcufft-static=11.0.2.54=hd3aeb46_0
+  - libcufile=1.9.1.3=0
+  - libcufile-dev=1.9.1.3=0
+  - libcufile-static=1.9.1.3=0
+  - libcups=2.3.3=h4637d8d_4
+  - libcurand=10.3.5.147=0
+  - libcurand-dev=10.3.5.147=0
+  - libcurand-static=10.3.5.147=0
+  - libcurl=8.8.0=hca28451_1
+  - libcusolver=11.4.4.55=0
+  - libcusolver-dev=11.4.4.55=0
+  - libcusolver-static=11.4.5.107=hd3aeb46_0
+  - libcusparse=12.0.2.55=0
+  - libcusparse-dev=12.0.2.55=0
+  - libcusparse-static=12.1.0.106=hd3aeb46_0
+  - libdeflate=1.20=hd590300_0
+  - libedit=3.1.20191231=he28a2e2_2
+  - libev=4.33=h516909a_1
+  - libevent=2.1.12=hf998b51_1
+  - libexpat=2.6.2=h59595ed_0
+  - libffi=3.4.2=h7f98852_5
+  - libflac=1.4.3=h59595ed_0
+  - libgcc=7.2.0=h69d50b8_2
+  - libgcc-ng=13.1.0=he5830b7_0
+  - libgcrypt=1.11.0=h4ab18f5_1
+  - libgettextpo=0.22.5=h59595ed_2
+  - libgettextpo-devel=0.22.5=h59595ed_2
+  - libgfortran-ng=13.2.0=h69a702a_0
+  - libgfortran5=13.2.0=ha4646dd_0
+  - libglib=2.80.2=hf974151_0
+  - libgomp=13.1.0=he5830b7_0
+  - libgpg-error=1.50=h4f305b6_0
+  - libhwloc=2.9.3=default_h554bfaf_1009
+  - libiconv=1.17=h166bdaf_0
+  - libidn2=2.3.7=hd590300_0
+  - libjpeg-turbo=3.0.0=hd590300_1
+  - liblapack=3.9.0=21_linux64_mkl
+  - libllvm15=15.0.7=h5cf9203_3
+  - libmamba=1.4.2=hcea66bb_0
+  - libmambapy=1.4.2=py310h1428755_0
+  - libnghttp2=1.58.0=h47da74e_1
+  - libnl=3.10.0=h4bc722e_0
+  - libnpp=12.0.2.50=0
+  - libnpp-dev=12.0.2.50=0
+  - libnpp-static=12.1.0.40=hd3aeb46_0
+  - libnsl=2.0.0=h7f98852_0
+  - libnvjitlink=12.1.105=0
+  - libnvjitlink-dev=12.1.105=0
+  - libnvjitlink-static=12.1.105=hd3aeb46_0
+  - libnvjpeg=12.1.1.14=0
+  - libnvjpeg-dev=12.1.1.14=0
+  - libnvjpeg-static=12.2.0.2=ha770c72_0
+  - libogg=1.3.5=h4ab18f5_0
+  - libopenblas=0.3.27=pthreads_hac2b453_1
+  - libopus=1.3.1=h7f98852_1
+  - libpng=1.6.43=h2797004_0
+  - libpq=16.4=h482b261_0
+  - libsndfile=1.2.2=hc60ed4a_1
+  - libsodium=1.0.18=h36c2ea0_1
+  - libsolv=0.7.29=ha6fb4c9_0
+  - libsqlite=3.46.0=hde9e2c9_0
+  - libssh2=1.11.0=h0841786_0
+  - libstdcxx-ng=13.1.0=hfd8a6a1_0
+  - libsystemd0=255=h3516f8a_1
+  - libtasn1=4.19.0=h166bdaf_0
+  - libtiff=4.6.0=h1dd3fc0_3
+  - libunistring=0.9.10=h7f98852_0
+  - libuuid=2.38.1=h0b41bf4_0
+  - libuv=1.48.0=hd590300_0
+  - libvorbis=1.3.7=h9c3ff4c_0
+  - libwebp-base=1.4.0=hd590300_0
+  - libxcb=1.15=h0b41bf4_0
+  - libxkbcommon=1.6.0=h5d7e998_0
+  - libxml2=2.11.6=h232c23b_0
+  - libzlib=1.2.13=h4ab18f5_6
+  - llvm-openmp=18.1.7=ha31de31_0
+  - lz4-c=1.9.4=hcb278e6_0
+  - lzo=2.10=h516909a_1000
+  - mamba=1.4.2=py310h51d5547_0
+  - marisa-trie=1.1.0=py310hc6cd4ac_1
+  - markdown-it-py=3.0.0=pyhd8ed1ab_0
+  - markupsafe=2.1.5=py310h2372a71_0
+  - matplotlib=3.9.1=py310hff52083_1
+  - matplotlib-base=3.9.1=py310hf02ac8c_2
+  - matplotlib-inline=0.1.7=pyhd8ed1ab_0
+  - mdurl=0.1.2=pyhd8ed1ab_0
+  - mkl=2024.0.0=ha957f24_49657
+  - mkl-include=2024.2.0=ha957f24_665
+  - mpc=1.3.1=hfe3b2da_0
+  - mpfr=4.2.1=h38ae2d0_2
+  - mpg123=1.32.6=h59595ed_0
+  - mpi=1.0=openmpi
+  - mpi4py=3.1.6=py310hb2ba3f8_1
+  - mpmath=1.3.0=pyhd8ed1ab_0
+  - munkres=1.1.4=pyh9f0ad1d_0
+  - murmurhash=1.0.10=py310hc6cd4ac_1
+  - mysql-common=8.0.33=hf1915f5_6
+  - mysql-libs=8.0.33=hca2cd23_6
+  - ncurses=6.5=h59595ed_0
+  - nest-asyncio=1.6.0=pyhd8ed1ab_0
+  - nettle=3.7.3=hbbd107a_1
+  - networkx=3.3=pyhd8ed1ab_1
+  - nspr=4.35=h27087fc_0
+  - nss=3.100=hca3bf56_0
+  - openh264=2.1.1=h780b84a_0
+  - openjpeg=2.5.2=h488ebb8_0
+  - openmpi=5.0.3=h817cd4e_101
+  - openssl=3.3.1=h4bc722e_2
+  - packaging=23.1=pyhd8ed1ab_0
+  - pandas=2.2.2=py310hf9f9076_1
+  - parso=0.8.4=pyhd8ed1ab_0
+  - pcre2=10.43=hcad00b1_0
+  - pexpect=4.9.0=pyhd8ed1ab_0
+  - pickleshare=0.7.5=py_1003
+  - pillow=10.3.0=py310hf73ecf8_0
+  - pixman=0.43.2=h59595ed_0
+  - platformdirs=4.2.2=pyhd8ed1ab_0
+  - pluggy=1.3.0=pyhd8ed1ab_0
+  - ply=3.11=pyhd8ed1ab_2
+  - preshed=3.0.9=py310hc6cd4ac_1
+  - prompt-toolkit=3.0.47=pyha770c72_0
+  - psutil=6.0.0=py310hc51659f_0
+  - pthread-stubs=0.4=h36c2ea0_1001
+  - ptyprocess=0.7.0=pyhd3deb0d_0
+  - pulseaudio-client=16.1=hb77b528_5
+  - pure_eval=0.2.3=pyhd8ed1ab_0
+  - pyasn1=0.6.0=pyhd8ed1ab_0
+  - pybind11=2.13.1=py310h25c7140_0
+  - pybind11-abi=4=hd8ed1ab_3
+  - pybind11-global=2.13.1=py310h25c7140_0
+  - pycosat=0.6.4=py310h5764c6d_1
+  - pycparser=2.21=pyhd8ed1ab_0
+  - pydantic=2.8.2=pyhd8ed1ab_0
+  - pydantic-core=2.20.1=py310h42e942d_0
+  - pygments=2.18.0=pyhd8ed1ab_0
+  - pyparsing=3.1.2=pyhd8ed1ab_0
+  - pyqt=5.15.9=py310h04931ad_5
+  - pyqt5-sip=12.12.2=py310hc6cd4ac_5
+  - pysocks=1.7.1=pyha2e5f31_6
+  - python=3.10.12=hd12c33a_0_cpython
+  - python-dateutil=2.9.0=pyhd8ed1ab_0
+  - python-tzdata=2024.1=pyhd8ed1ab_0
+  - python_abi=3.10=3_cp310
+  - pytorch-cuda=12.1=ha16c6d3_5
+  - pytorch-mutex=1.0=cuda
+  - pytz=2024.1=pyhd8ed1ab_0
+  - pyyaml=6.0.2=py310h5b4e0ec_0
+  - pyzmq=26.1.0=py310h7d2b5bf_0
+  - qhull=2020.2=h434a139_5
+  - qt-main=5.15.8=h82b777d_17
+  - readline=8.2=h8228510_1
+  - reproc=14.2.4=h0b41bf4_0
+  - reproc-cpp=14.2.4=hcb278e6_0
+  - requests=2.32.3=pyhd8ed1ab_0
+  - rhash=1.4.4=hd590300_0
+  - rich=13.7.1=pyhd8ed1ab_0
+  - rsa=4.7.2=pyh44b312d_0
+  - ruamel.yaml=0.17.32=py310h2372a71_0
+  - ruamel.yaml.clib=0.2.7=py310h1fa729e_1
+  - s3transfer=0.10.2=pyhd8ed1ab_0
+  - scipy=1.14.0=py310h93e2701_1
+  - shellingham=1.5.4=pyhd8ed1ab_0
+  - sip=6.7.12=py310hc6cd4ac_0
+  - six=1.16.0=pyh6c4a22f_0
+  - smart-open=7.0.4=hd8ed1ab_0
+  - smart_open=7.0.4=pyhd8ed1ab_0
+  - spacy=3.7.5=py310h9fd543b_1
+  - spacy-legacy=3.0.12=pyhd8ed1ab_0
+  - spacy-loggers=1.0.5=pyhd8ed1ab_0
+  - srsly=2.4.8=py310hc6cd4ac_1
+  - stack_data=0.6.2=pyhd8ed1ab_0
+  - sympy=1.13.0=pypyh2585a3b_103
+  - tbb=2021.8.0=hdb19cb5_0
+  - thinc=8.2.5=py310h9fd543b_0
+  - threadpoolctl=3.5.0=pyhc1e730c_0
+  - tk=8.6.13=noxft_h4845f30_101
+  - toml=0.10.2=pyhd8ed1ab_0
+  - tomli=2.0.1=pyhd8ed1ab_0
+  - toolz=0.12.0=pyhd8ed1ab_0
+  - torchdata=0.7.0=py310
+  - torchtext=0.16.0=py310
+  - tornado=6.4.1=py310hc51659f_0
+  - tqdm=4.66.5=pyhd8ed1ab_0
+  - traitlets=5.14.3=pyhd8ed1ab_0
+  - typer=0.12.3=pyhd8ed1ab_0
+  - typer-slim=0.12.3=pyhd8ed1ab_0
+  - typer-slim-standard=0.12.3=hd8ed1ab_0
+  - typing=3.10.0.0=pyhd8ed1ab_1
+  - typing-extensions=4.12.2=hd8ed1ab_0
+  - typing_extensions=4.12.2=pyha770c72_0
+  - tzdata=2023c=h71feb2d_0
+  - unicodedata2=15.1.0=py310h2372a71_0
+  - urllib3=1.26.19=pyhd8ed1ab_0
+  - wasabi=1.1.2=py310hff52083_1
+  - wcwidth=0.2.13=pyhd8ed1ab_0
+  - weasel=0.4.1=pyhd8ed1ab_1
+  - wheel=0.41.2=pyhd8ed1ab_0
+  - wrapt=1.16.0=py310h2372a71_0
+  - xcb-util=0.4.0=hd590300_1
+  - xcb-util-image=0.4.0=h8ee46fc_1
+  - xcb-util-keysyms=0.4.0=h8ee46fc_1
+  - xcb-util-renderutil=0.3.9=hd590300_1
+  - xcb-util-wm=0.4.1=h8ee46fc_1
+  - xkeyboard-config=2.42=h4ab18f5_0
+  - xorg-kbproto=1.0.7=h7f98852_1002
+  - xorg-libice=1.1.1=hd590300_0
+  - xorg-libsm=1.2.4=h7391055_0
+  - xorg-libx11=1.8.9=h8ee46fc_0
+  - xorg-libxau=1.0.11=hd590300_0
+  - xorg-libxdmcp=1.1.3=h7f98852_0
+  - xorg-libxext=1.3.4=h0b41bf4_2
+  - xorg-libxrender=0.9.11=hd590300_0
+  - xorg-renderproto=0.11.1=h7f98852_1002
+  - xorg-xextproto=7.3.0=h0b41bf4_1003
+  - xorg-xf86vidmodeproto=2.3.1=h7f98852_1002
+  - xorg-xproto=7.0.31=h7f98852_1007
+  - xz=5.2.6=h166bdaf_0
+  - yaml=0.2.5=h7f98852_2
+  - yaml-cpp=0.7.0=h27087fc_2
+  - zeromq=4.3.5=h75354e8_4
+  - zipp=3.19.2=pyhd8ed1ab_0
+  - zlib=1.2.13=h4ab18f5_6
+  - zstandard=0.19.0=py310h5764c6d_0
+  - zstd=1.5.6=ha6fb4c9_0
+  - pip:
+      - absl-py==2.1.0
+      - accelerate==1.1.1
+      - aiohappyeyeballs==2.4.3
+      - aiohttp==3.10.10
+      - aiosignal==1.3.1
+      - antlr4-python3-runtime==4.9.3
+      - apex==0.1
+      - appdirs==1.4.4
+      - argparse==1.4.0
+      - async-timeout==4.0.3
+      - attrdict==2.0.1
+      - attrs==23.2.0
+      - awscli==1.33.40
+      - backcall==0.2.0
+      - bcrypt==4.2.0
+      - beautifulsoup4==4.12.3
+      - bleach==6.2.0
+      - bokeh==3.5.1
+      - boto3==1.34.158
+      - botocore==1.34.158
+      - brotli==1.0.9
+      - cachetools==5.5.0
+      - chardet==5.2.0
+      - cloudpickle==2.2.1
+      - cmake==3.30.2
+      - cryptography==41.0.7
+      - datasets==3.1.0
+      - defusedxml==0.7.1
+      - dill==0.3.8
+      - docker==7.1.0
+      - docker-pycreds==0.4.0
+      - docopt==0.6.2
+      - docstring-parser==0.16
+      - einops==0.8.0
+      - fastjsonschema==2.20.0
+      - fire==0.6.0
+      - flash-attn==2.5.5
+      - frozenlist==1.5.0
+      - fsspec==2024.6.1
+      - gevent==24.2.1
+      - gitdb==4.0.11
+      - gitpython==3.1.43
+      - google-pasta==0.2.0
+      - greenlet==3.0.3
+      - huggingface-hub==0.26.2
+      - hydra-core==1.3.2
+      - imageio==2.34.2
+      - importlib-metadata==6.11.0
+      - importlib-resources==6.1.1
+      - inotify-simple==1.2.1
+      - ipykernel==6.29.1
+      - ipython==8.12.3
+      - jsonschema==4.23.0
+      - jsonschema-specifications==2023.12.1
+      - jupyterlab-pygments==0.3.0
+      - llvmlite==0.43.0
+      - mistune==3.0.2
+      - multidict==6.1.0
+      - multiprocess==0.70.16
+      - nbclient==0.10.0
+      - nbconvert==7.16.4
+      - nbformat==5.10.4
+      - ninja==1.11.1.1
+      - numba==0.60.0
+      - numpy==1.24.3
+      - nvidia-cublas-cu12==12.1.3.1
+      - nvidia-cuda-cupti-cu12==12.1.105
+      - nvidia-cuda-nvrtc-cu12==12.1.105
+      - nvidia-cuda-runtime-cu12==12.1.105
+      - nvidia-cudnn-cu12==8.9.2.26
+      - nvidia-cufft-cu12==11.0.2.54
+      - nvidia-curand-cu12==10.3.2.106
+      - nvidia-cusolver-cu12==11.4.5.107
+      - nvidia-cusparse-cu12==12.1.0.106
+      - nvidia-ml-py==12.535.161
+      - nvidia-nccl-cu12==2.19.3
+      - nvidia-nvjitlink-cu12==12.6.77
+      - nvidia-nvtx-cu12==12.1.105
+      - nvitop==1.3.2
+      - omegaconf==2.3.0
+      - opencv-python==4.10.0.84
+      - pandocfilters==1.5.1
+      - paramiko==3.4.0
+      - pathos==0.3.2
+      - pip==24.1.2
+      - pip-chill==1.0.3
+      - pipreqs==0.5.0
+      - plotly==5.23.0
+      - pox==0.3.4
+      - ppft==1.7.6.8
+      - propcache==0.2.0
+      - protobuf==3.20.3
+      - pyarrow==17.0.0
+      - pyfunctional==1.5.0
+      - pynacl==1.5.0
+      - pyopenssl==23.2.0
+      - referencing==0.35.1
+      - regex==2024.11.6
+      - retrying==1.3.4
+      - rpds-py==0.20.0
+      - s3fs==0.4.2
+      - safetensors==0.4.5
+      - sagemaker==2.224.2
+      - sagemaker-experiments==0.1.45
+      - sagemaker-pytorch-training==2.8.1
+      - sagemaker-training==4.8.1
+      - schema==0.7.7
+      - scikit-learn==1.3.2
+      - seaborn==0.13.2
+      - sentencepiece==0.2.0
+      - sentry-sdk==2.18.0
+      - setproctitle==1.3.3
+      - setuptools==72.1.0
+      - shap==0.46.0
+      - shtab==1.7.1
+      - slicer==0.0.8
+      - smclarify==0.5
+      - smdebug-rulesconfig==1.0.1
+      - smdistributed-dataparallel==2.1.0
+      - smmap==5.0.1
+      - smprof==0.3.334
+      - soupsieve==2.6
+      - tabulate==0.9.0
+      - tblib==3.0.0
+      - tenacity==9.0.0
+      - tensor-parallel==2.0.0
+      - termcolor==2.5.0
+      - tinycss2==1.4.0
+      - tokenizers==0.20.3
+      - torch==2.2.0
+      - torchaudio==2.2.0
+      - torchnet==0.0.4
+      - torchvision==0.17.0
+      - transformer-engine==0.12.0+170797
+      - transformers==4.46.0
+      - triton==2.2.0
+      - trl==0.12.0
+      - tyro==0.8.5
+      - visdom==0.2.4
+      - wandb==0.16.3
+      - webencodings==0.5.1
+      - websocket-client==1.8.0
+      - werkzeug==3.0.3
+      - xxhash==3.5.0
+      - xyzservices==2024.6.0
+      - yarg==0.1.9
+      - yarl==1.17.1
+      - zope-event==5.0
+      - zope-interface==7.0.1
+prefix: /opt/conda

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/config.yaml ADDED Viewed

	@@ -0,0 +1,948 @@

+wandb_version: 1
+sagemaker_training_job_name:
+  desc: null
+  value: kushalarora-rvv-main-2024-11-13-16-43-09-915
+batch_size:
+  desc: null
+  value: 64
+cache_dir:
+  desc: null
+  value: /opt/ml/data/input/.cache
+dataset:
+  desc: null
+  value: code-contests
+gradient_accumulation_steps:
+  desc: null
+  value: 8
+logging_steps:
+  desc: null
+  value: 5
+lr:
+  desc: null
+  value: 1e-5
+max_seq_length:
+  desc: null
+  value: 2048
+model_name:
+  desc: null
+  value: Qwen/Qwen2.5-Coder-7B-Instruct
+num_train_epochs:
+  desc: null
+  value: 2
+output_dir:
+  desc: null
+  value: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048
+push_to_hub:
+  desc: null
+  value: true
+run_name:
+  desc: null
+  value: sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048
+sagemaker_container_log_level:
+  desc: null
+  value: 20
+sagemaker_instance_type:
+  desc: null
+  value: ml.p5.48xlarge
+sagemaker_job_name:
+  desc: null
+  value: kushalarora-rvv-main-2024-11-13-16-43-09-915
+sagemaker_program:
+  desc: null
+  value: sft.py
+sagemaker_region:
+  desc: null
+  value: us-east-1
+sagemaker_submit_directory:
+  desc: null
+  value: s3://tri-ml-datasets/kushalarora-rvv-main-2024-11-13-16-43-09-915/source/sourcedir.tar.gz
+sagemaker_torch_distributed_enabled:
+  desc: null
+  value: 'true'
+save_steps:
+  desc: null
+  value: 100
+schedule:
+  desc: null
+  value: cosine
+wandb_project:
+  desc: null
+  value: sft-codecontests-1112
+weight_decay:
+  desc: null
+  value: 0.0
+additional_framework_parameters:
+  desc: null
+  value:
+    sagemaker_instance_type: ml.p5.48xlarge
+    sagemaker_torch_distributed_enabled: true
+channel_input_dirs:
+  desc: null
+  value: {}
+current_host:
+  desc: null
+  value: algo-1
+current_instance_group:
+  desc: null
+  value: homogeneousCluster
+current_instance_group_hosts:
+  desc: null
+  value:
+  - algo-1
+current_instance_type:
+  desc: null
+  value: ml.p5.48xlarge
+distribution_hosts:
+  desc: null
+  value:
+  - algo-1
+distribution_instance_groups:
+  desc: null
+  value:
+  - homogeneousCluster
+framework_module:
+  desc: null
+  value: sagemaker_pytorch_container.training:main
+hosts:
+  desc: null
+  value:
+  - algo-1
+hyperparameters:
+  desc: null
+  value:
+    batch_size: 64
+    cache_dir: /opt/ml/data/input/.cache
+    dataset: code-contests
+    gradient_accumulation_steps: 8
+    logging_steps: 5
+    lr: 1e-5
+    max_seq_length: 2048
+    model_name: Qwen/Qwen2.5-Coder-7B-Instruct
+    num_train_epochs: 2
+    output_dir: /opt/ml/model/
+    push_to_hub: true
+    run_name: sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048
+    save_steps: 100
+    schedule: cosine
+    wandb_project: sft-codecontests-1112
+    weight_decay: 0.0
+input_config_dir:
+  desc: null
+  value: /opt/ml/input/config
+input_data_config:
+  desc: null
+  value: {}
+input_dir:
+  desc: null
+  value: /opt/ml/input
+instance_groups:
+  desc: null
+  value:
+  - homogeneousCluster
+instance_groups_dict:
+  desc: null
+  value:
+    homogeneousCluster:
+      hosts:
+      - algo-1
+      instance_group_name: homogeneousCluster
+      instance_type: ml.p5.48xlarge
+is_hetero:
+  desc: null
+  value: false
+is_master:
+  desc: null
+  value: true
+is_modelparallel_enabled:
+  desc: null
+  value: null
+is_smddpmprun_installed:
+  desc: null
+  value: false
+is_smddprun_installed:
+  desc: null
+  value: true
+job_name:
+  desc: null
+  value: kushalarora-rvv-main-2024-11-13-16-43-09-915
+log_level:
+  desc: null
+  value: passive
+master_hostname:
+  desc: null
+  value: algo-1
+model_dir:
+  desc: null
+  value: /opt/ml/model
+module_dir:
+  desc: null
+  value: s3://tri-ml-datasets/kushalarora-rvv-main-2024-11-13-16-43-09-915/source/sourcedir.tar.gz
+module_name:
+  desc: null
+  value: /opt/ml/code/qlearning_reasoning/training/sft
+network_interface_name:
+  desc: null
+  value: eth0
+num_cpus:
+  desc: null
+  value: 192
+num_gpus:
+  desc: null
+  value: 8
+num_neurons:
+  desc: null
+  value: 0
+output_data_dir:
+  desc: null
+  value: /opt/ml/output/data
+output_intermediate_dir:
+  desc: null
+  value: /opt/ml/output/intermediate
+resource_config:
+  desc: null
+  value:
+    current_group_name: homogeneousCluster
+    current_host: algo-1
+    current_instance_type: ml.p5.48xlarge
+    hosts:
+    - algo-1
+    instance_groups:
+    - hosts:
+      - algo-1
+      instance_group_name: homogeneousCluster
+      instance_type: ml.p5.48xlarge
+    network_interface_name: eth0
+user_entry_point:
+  desc: null
+  value: /opt/ml/code/qlearning_reasoning/training/sft.py
+_wandb:
+  desc: null
+  value:
+    code_path: code/qlearning_reasoning/training/sft.py
+    python_version: 3.10.12
+    cli_version: 0.16.3
+    framework: huggingface
+    huggingface_version: 4.46.0
+    is_jupyter_run: false
+    is_kaggle_kernel: false
+    start_time: 1731517807.43302
+    t:
+      1:
+      - 1
+      - 5
+      - 11
+      - 41
+      - 49
+      - 51
+      - 53
+      - 55
+      - 71
+      - 84
+      2:
+      - 1
+      - 5
+      - 11
+      - 41
+      - 49
+      - 51
+      - 53
+      - 55
+      - 71
+      - 84
+      3:
+      - 7
+      - 9
+      - 13
+      - 19
+      - 23
+      4: 3.10.12
+      5: 0.16.3
+      6: 4.46.0
+      8:
+      - 5
+      9:
+        1: transformers_trainer
+      13: linux-x86_64
+    m:
+    - 1: train/global_step
+      6:
+      - 3
+    - 1: train/loss
+      5: 1
+      6:
+      - 1
+    - 1: train/grad_norm
+      5: 1
+      6:
+      - 1
+    - 1: train/learning_rate
+      5: 1
+      6:
+      - 1
+    - 1: train/epoch
+      5: 1
+      6:
+      - 1
+    - 1: eval/loss
+      5: 1
+      6:
+      - 1
+    - 1: eval/runtime
+      5: 1
+      6:
+      - 1
+    - 1: eval/samples_per_second
+      5: 1
+      6:
+      - 1
+    - 1: eval/steps_per_second
+      5: 1
+      6:
+      - 1
+vocab_size:
+  desc: null
+  value: 151671
+max_position_embeddings:
+  desc: null
+  value: 32768
+hidden_size:
+  desc: null
+  value: 3584
+intermediate_size:
+  desc: null
+  value: 18944
+num_hidden_layers:
+  desc: null
+  value: 28
+num_attention_heads:
+  desc: null
+  value: 28
+use_sliding_window:
+  desc: null
+  value: false
+sliding_window:
+  desc: null
+  value: null
+max_window_layers:
+  desc: null
+  value: 28
+num_key_value_heads:
+  desc: null
+  value: 4
+hidden_act:
+  desc: null
+  value: silu
+initializer_range:
+  desc: null
+  value: 0.02
+rms_norm_eps:
+  desc: null
+  value: 1.0e-06
+use_cache:
+  desc: null
+  value: false
+rope_theta:
+  desc: null
+  value: 1000000.0
+rope_scaling:
+  desc: null
+  value: null
+attention_dropout:
+  desc: null
+  value: 0.0
+return_dict:
+  desc: null
+  value: true
+output_hidden_states:
+  desc: null
+  value: false
+output_attentions:
+  desc: null
+  value: false
+torchscript:
+  desc: null
+  value: false
+torch_dtype:
+  desc: null
+  value: bfloat16
+use_bfloat16:
+  desc: null
+  value: false
+tf_legacy_loss:
+  desc: null
+  value: false
+pruned_heads:
+  desc: null
+  value: {}
+tie_word_embeddings:
+  desc: null
+  value: false
+chunk_size_feed_forward:
+  desc: null
+  value: 0
+is_encoder_decoder:
+  desc: null
+  value: false
+is_decoder:
+  desc: null
+  value: false
+cross_attention_hidden_size:
+  desc: null
+  value: null
+add_cross_attention:
+  desc: null
+  value: false
+tie_encoder_decoder:
+  desc: null
+  value: false
+max_length:
+  desc: null
+  value: 20
+min_length:
+  desc: null
+  value: 0
+do_sample:
+  desc: null
+  value: false
+early_stopping:
+  desc: null
+  value: false
+num_beams:
+  desc: null
+  value: 1
+num_beam_groups:
+  desc: null
+  value: 1
+diversity_penalty:
+  desc: null
+  value: 0.0
+temperature:
+  desc: null
+  value: 1.0
+top_k:
+  desc: null
+  value: 50
+top_p:
+  desc: null
+  value: 1.0
+typical_p:
+  desc: null
+  value: 1.0
+repetition_penalty:
+  desc: null
+  value: 1.0
+length_penalty:
+  desc: null
+  value: 1.0
+no_repeat_ngram_size:
+  desc: null
+  value: 0
+encoder_no_repeat_ngram_size:
+  desc: null
+  value: 0
+bad_words_ids:
+  desc: null
+  value: null
+num_return_sequences:
+  desc: null
+  value: 1
+output_scores:
+  desc: null
+  value: false
+return_dict_in_generate:
+  desc: null
+  value: false
+forced_bos_token_id:
+  desc: null
+  value: null
+forced_eos_token_id:
+  desc: null
+  value: null
+remove_invalid_values:
+  desc: null
+  value: false
+exponential_decay_length_penalty:
+  desc: null
+  value: null
+suppress_tokens:
+  desc: null
+  value: null
+begin_suppress_tokens:
+  desc: null
+  value: null
+architectures:
+  desc: null
+  value:
+  - Qwen2ForCausalLM
+finetuning_task:
+  desc: null
+  value: null
+id2label:
+  desc: null
+  value:
+    '0': LABEL_0
+    '1': LABEL_1
+label2id:
+  desc: null
+  value:
+    LABEL_0: 0
+    LABEL_1: 1
+tokenizer_class:
+  desc: null
+  value: null
+prefix:
+  desc: null
+  value: null
+bos_token_id:
+  desc: null
+  value: null
+pad_token_id:
+  desc: null
+  value: 151643
+eos_token_id:
+  desc: null
+  value: 151645
+sep_token_id:
+  desc: null
+  value: null
+decoder_start_token_id:
+  desc: null
+  value: null
+task_specific_params:
+  desc: null
+  value: null
+problem_type:
+  desc: null
+  value: null
+_name_or_path:
+  desc: null
+  value: Qwen/Qwen2.5-Coder-7B-Instruct
+_attn_implementation_autoset:
+  desc: null
+  value: true
+transformers_version:
+  desc: null
+  value: 4.46.0
+model_type:
+  desc: null
+  value: qwen2
+overwrite_output_dir:
+  desc: null
+  value: false
+do_train:
+  desc: null
+  value: false
+do_eval:
+  desc: null
+  value: true
+do_predict:
+  desc: null
+  value: false
+eval_strategy:
+  desc: null
+  value: steps
+prediction_loss_only:
+  desc: null
+  value: false
+per_device_train_batch_size:
+  desc: null
+  value: 8
+per_device_eval_batch_size:
+  desc: null
+  value: 8
+per_gpu_train_batch_size:
+  desc: null
+  value: null
+per_gpu_eval_batch_size:
+  desc: null
+  value: null
+eval_accumulation_steps:
+  desc: null
+  value: null
+eval_delay:
+  desc: null
+  value: 0
+torch_empty_cache_steps:
+  desc: null
+  value: null
+learning_rate:
+  desc: null
+  value: 1.0e-05
+adam_beta1:
+  desc: null
+  value: 0.9
+adam_beta2:
+  desc: null
+  value: 0.999
+adam_epsilon:
+  desc: null
+  value: 1.0e-08
+max_grad_norm:
+  desc: null
+  value: 1.0
+max_steps:
+  desc: null
+  value: -1
+lr_scheduler_type:
+  desc: null
+  value: cosine
+lr_scheduler_kwargs:
+  desc: null
+  value: {}
+warmup_ratio:
+  desc: null
+  value: 0.0
+warmup_steps:
+  desc: null
+  value: 0
+log_level_replica:
+  desc: null
+  value: warning
+log_on_each_node:
+  desc: null
+  value: true
+logging_dir:
+  desc: null
+  value: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/runs/Nov13_17-09-37_algo-1
+logging_strategy:
+  desc: null
+  value: steps
+logging_first_step:
+  desc: null
+  value: true
+logging_nan_inf_filter:
+  desc: null
+  value: true
+save_strategy:
+  desc: null
+  value: epoch
+save_total_limit:
+  desc: null
+  value: null
+save_safetensors:
+  desc: null
+  value: true
+save_on_each_node:
+  desc: null
+  value: false
+save_only_model:
+  desc: null
+  value: false
+restore_callback_states_from_checkpoint:
+  desc: null
+  value: false
+no_cuda:
+  desc: null
+  value: false
+use_cpu:
+  desc: null
+  value: false
+use_mps_device:
+  desc: null
+  value: false
+seed:
+  desc: null
+  value: 42
+data_seed:
+  desc: null
+  value: null
+jit_mode_eval:
+  desc: null
+  value: false
+use_ipex:
+  desc: null
+  value: false
+bf16:
+  desc: null
+  value: false
+fp16:
+  desc: null
+  value: false
+fp16_opt_level:
+  desc: null
+  value: O1
+half_precision_backend:
+  desc: null
+  value: auto
+bf16_full_eval:
+  desc: null
+  value: false
+fp16_full_eval:
+  desc: null
+  value: false
+tf32:
+  desc: null
+  value: null
+local_rank:
+  desc: null
+  value: 0
+ddp_backend:
+  desc: null
+  value: null
+tpu_num_cores:
+  desc: null
+  value: null
+tpu_metrics_debug:
+  desc: null
+  value: false
+debug:
+  desc: null
+  value: []
+dataloader_drop_last:
+  desc: null
+  value: false
+eval_steps:
+  desc: null
+  value: 5
+dataloader_num_workers:
+  desc: null
+  value: 0
+dataloader_prefetch_factor:
+  desc: null
+  value: null
+past_index:
+  desc: null
+  value: -1
+disable_tqdm:
+  desc: null
+  value: false
+remove_unused_columns:
+  desc: null
+  value: true
+label_names:
+  desc: null
+  value: null
+load_best_model_at_end:
+  desc: null
+  value: false
+metric_for_best_model:
+  desc: null
+  value: null
+greater_is_better:
+  desc: null
+  value: null
+ignore_data_skip:
+  desc: null
+  value: false
+fsdp:
+  desc: null
+  value:
+  - full_shard
+  - auto_wrap
+fsdp_min_num_params:
+  desc: null
+  value: 0
+fsdp_config:
+  desc: null
+  value:
+    activation_checkpointing: false
+    auto_wrap_policy: TRANSFORMER_BASED_WRAP
+    backward_prefetch: BACKWARD_PRE
+    cpu_ram_efficient_loading: true
+    forward_prefetch: false
+    offload_params: false
+    sharding_strategy: FULL_SHARD
+    state_dict_type: FULL_STATE_DICT
+    sync_module_states: true
+    min_num_params: 0
+    xla: false
+    xla_fsdp_v2: false
+    xla_fsdp_grad_ckpt: false
+fsdp_transformer_layer_cls_to_wrap:
+  desc: null
+  value: null
+accelerator_config:
+  desc: null
+  value:
+    split_batches: false
+    dispatch_batches: null
+    even_batches: true
+    use_seedable_sampler: true
+    non_blocking: false
+    gradient_accumulation_kwargs: null
+deepspeed:
+  desc: null
+  value: null
+label_smoothing_factor:
+  desc: null
+  value: 0.0
+optim:
+  desc: null
+  value: adamw_torch
+optim_args:
+  desc: null
+  value: null
+adafactor:
+  desc: null
+  value: false
+group_by_length:
+  desc: null
+  value: false
+length_column_name:
+  desc: null
+  value: length
+report_to:
+  desc: null
+  value:
+  - wandb
+ddp_find_unused_parameters:
+  desc: null
+  value: null
+ddp_bucket_cap_mb:
+  desc: null
+  value: null
+ddp_broadcast_buffers:
+  desc: null
+  value: null
+dataloader_pin_memory:
+  desc: null
+  value: true
+dataloader_persistent_workers:
+  desc: null
+  value: false
+skip_memory_metrics:
+  desc: null
+  value: true
+use_legacy_prediction_loop:
+  desc: null
+  value: false
+resume_from_checkpoint:
+  desc: null
+  value: null
+hub_model_id:
+  desc: null
+  value: sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_
+hub_strategy:
+  desc: null
+  value: every_save
+hub_token:
+  desc: null
+  value: <HUB_TOKEN>
+hub_private_repo:
+  desc: null
+  value: false
+hub_always_push:
+  desc: null
+  value: false
+gradient_checkpointing:
+  desc: null
+  value: false
+gradient_checkpointing_kwargs:
+  desc: null
+  value:
+    use_reentrant: false
+include_inputs_for_metrics:
+  desc: null
+  value: false
+include_for_metrics:
+  desc: null
+  value: []
+eval_do_concat_batches:
+  desc: null
+  value: true
+fp16_backend:
+  desc: null
+  value: auto
+evaluation_strategy:
+  desc: null
+  value: null
+push_to_hub_model_id:
+  desc: null
+  value: null
+push_to_hub_organization:
+  desc: null
+  value: null
+push_to_hub_token:
+  desc: null
+  value: <PUSH_TO_HUB_TOKEN>
+mp_parameters:
+  desc: null
+  value: ''
+auto_find_batch_size:
+  desc: null
+  value: false
+full_determinism:
+  desc: null
+  value: false
+torchdynamo:
+  desc: null
+  value: null
+ray_scope:
+  desc: null
+  value: last
+ddp_timeout:
+  desc: null
+  value: 1800
+torch_compile:
+  desc: null
+  value: false
+torch_compile_backend:
+  desc: null
+  value: null
+torch_compile_mode:
+  desc: null
+  value: null
+dispatch_batches:
+  desc: null
+  value: null
+split_batches:
+  desc: null
+  value: null
+include_tokens_per_second:
+  desc: null
+  value: false
+include_num_input_tokens_seen:
+  desc: null
+  value: false
+neftune_noise_alpha:
+  desc: null
+  value: null
+optim_target_modules:
+  desc: null
+  value: null
+batch_eval_metrics:
+  desc: null
+  value: false
+eval_on_start:
+  desc: null
+  value: false
+use_liger_kernel:
+  desc: null
+  value: false
+eval_use_gather_object:
+  desc: null
+  value: false
+dataset_text_field:
+  desc: null
+  value: text
+packing:
+  desc: null
+  value: false
+dataset_num_proc:
+  desc: null
+  value: null
+dataset_batch_size:
+  desc: null
+  value: 64
+model_init_kwargs:
+  desc: null
+  value: null
+dataset_kwargs:
+  desc: null
+  value: {}
+eval_packing:
+  desc: null
+  value: null
+num_of_sequences:
+  desc: null
+  value: 1024
+chars_per_token:
+  desc: null
+  value: <CHARS_PER_TOKEN>
+use_liger:
+  desc: null
+  value: false
+model/num_parameters:
+  desc: null
+  value: 951599936

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/diff.patch ADDED Viewed

	@@ -0,0 +1,49 @@

+diff --git a/qlearning_reasoning/training/sft.py b/qlearning_reasoning/training/sft.py
+index 583fba2..1c2b359 100644
+--- a/qlearning_reasoning/training/sft.py
++++ b/qlearning_reasoning/training/sft.py
+@@ -51,6 +51,7 @@ flags.DEFINE_string('fsdp', "full_shard auto_wrap", 'If to use FSDP')
+ flags.DEFINE_string('fsdp_config', "qlearning_reasoning/accelerate_configs/fsdp_config.json", 'FSDP config to use.')
+ flags.DEFINE_boolean("push_to_hub", False, "Should the model be uploaded to Huggingface hub?")
+ flags.DEFINE_boolean('add_step_tokens', True, 'Add step tokens')
++flags.DEFINE_string("hub_model_id", None, "Hub model id. If not defined it will be truncated run name.")
+ START_OF_STEP_TOKEN = '[STEP]'
+ END_OF_STEP_TOKEN = '[/STEP]'
+@@ -60,6 +61,10 @@ START_OF_REVISION_TOKEN = '[REVISION]'
+ END_OF_REVISION_TOKEN = '[/REVISION]'
+ def main(_):
++
++    if FLAGS.hub_model_id is None:
++        FLAGS.hub_model_id = FLAGS.run_name[:96]
++
+     if not os.path.exists(FLAGS.output_dir):
+         os.makedirs(FLAGS.output_dir, exist_ok=True)
+         os.makedirs(f"{FLAGS.output_dir}/{FLAGS.run_name}", exist_ok=True)
+@@ -219,11 +224,11 @@ def main(_):
+         optim=FLAGS.optim,
+         weight_decay=FLAGS.weight_decay,
+         warmup_steps=FLAGS.warmup_steps,
+-        max_steps=num_steps,
+         fsdp=FLAGS.fsdp,
+         fsdp_config=FLAGS.fsdp_config if FLAGS.fsdp != '' else None,
+         push_to_hub=FLAGS.push_to_hub,
+         num_train_epochs=num_train_epochs,
++        hub_model_id=FLAGS.hub_model_id
+     )
+     flags_dict = FLAGS.flag_values_dict()
+diff --git a/sagemaker/launch_sagemaker.py b/sagemaker/launch_sagemaker.py
+index 3316ede..98ed205 100644
+--- a/sagemaker/launch_sagemaker.py
++++ b/sagemaker/launch_sagemaker.py
+@@ -224,7 +224,7 @@ def main(argv):
+     # TODO: verify if this breaks the code
+     environment = {
+         "PYTHONPATH": "/opt/ml/code/qlearning_reasoning/",
+-        "HF_HOME": "/opt/ml/input/data/training/hf-cache",
++        "HF_HOME": "/opt/ml/data/input/.cache",
+         "HF_TOKEN": get_hf_token(),
+         "WANDB_API_KEY": get_wandb_api_key(),
+         "SM_USE_RESERVED_CAPACITY": "1",

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log ADDED Viewed

The diff for this file is too large to render. See raw diff

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/requirements.txt ADDED Viewed

	@@ -0,0 +1,289 @@

+absl-py==2.1.0
+accelerate==1.1.1
+aiohappyeyeballs==2.4.3
+aiohttp==3.10.10
+aiosignal==1.3.1
+annotated-types==0.7.0
+antlr4-python3-runtime==4.9.3
+apex==0.1
+appdirs==1.4.4
+argparse==1.4.0
+asttokens==2.4.1
+async-timeout==4.0.3
+attrdict==2.0.1
+attrs==23.2.0
+autocommand==2.2.2
+awscli==1.33.40
+backcall==0.2.0
+backports.tarfile==1.2.0
+bcrypt==4.2.0
+beautifulsoup4==4.12.3
+bleach==6.2.0
+blis==0.7.10
+bokeh==3.5.1
+boltons==23.0.0
+boto3==1.34.158
+botocore==1.34.158
+brotli==1.0.9
+cached-property==1.5.2
+cachetools==5.5.0
+catalogue==2.0.10
+certifi==2024.7.4
+cffi==1.15.1
+chardet==5.2.0
+charset-normalizer==3.2.0
+click==8.1.7
+cloudpathlib==0.18.1
+cloudpickle==2.2.1
+cmake==3.30.2
+colorama==0.4.6
+comm==0.2.2
+conda-libmamba-solver==23.3.0
+conda-package-handling==2.2.0
+conda-package-streaming==0.9.0
+conda==23.3.1
+confection==0.1.4
+contourpy==1.2.1
+cryptography==41.0.7
+cycler==0.12.1
+cymem==2.0.8
+cython==3.0.11
+datasets==3.1.0
+debugpy==1.8.5
+decorator==5.1.1
+defusedxml==0.7.1
+dill==0.3.8
+docker-pycreds==0.4.0
+docker==7.1.0
+docopt==0.6.2
+docstring-parser==0.16
+docutils==0.16
+einops==0.8.0
+exceptiongroup==1.2.2
+executing==2.0.1
+fastai==2.7.16
+fastcore==1.5.55
+fastdownload==0.0.7
+fastjsonschema==2.20.0
+fastprogress==1.0.3
+filelock==3.15.4
+fire==0.6.0
+flash-attn==2.5.5
+fonttools==4.53.1
+frozenlist==1.5.0
+fsspec==2024.6.1
+gevent==24.2.1
+gitdb==4.0.11
+gitpython==3.1.43
+gmpy2==2.1.5
+google-pasta==0.2.0
+greenlet==3.0.3
+h5py==3.11.0
+huggingface-hub==0.26.2
+hydra-core==1.3.2
+idna==3.7
+imageio==2.34.2
+importlib-metadata==6.11.0
+importlib-resources==6.1.1
+inflect==7.3.1
+inotify-simple==1.2.1
+ipykernel==6.29.1
+ipython==8.12.3
+jaraco.context==5.3.0
+jaraco.functools==4.0.1
+jaraco.text==3.12.1
+jedi==0.19.1
+jinja2==3.1.4
+jmespath==1.0.1
+joblib==1.4.2
+jsonpatch==1.32
+jsonpointer==2.0
+jsonschema-specifications==2023.12.1
+jsonschema==4.23.0
+jupyter-client==8.6.2
+jupyter-core==5.7.2
+jupyterlab-pygments==0.3.0
+kiwisolver==1.4.5
+langcodes==3.4.0
+language-data==1.2.0
+libmambapy==1.4.2
+llvmlite==0.43.0
+mamba==1.4.2
+marisa-trie==1.1.0
+markdown-it-py==3.0.0
+markupsafe==2.1.5
+matplotlib-inline==0.1.7
+matplotlib==3.9.1
+mdurl==0.1.2
+mistune==3.0.2
+more-itertools==10.3.0
+mpi4py==3.1.6
+mpmath==1.3.0
+multidict==6.1.0
+multiprocess==0.70.16
+munkres==1.1.4
+murmurhash==1.0.10
+nbclient==0.10.0
+nbconvert==7.16.4
+nbformat==5.10.4
+nest-asyncio==1.6.0
+networkx==3.3
+ninja==1.11.1.1
+numba==0.60.0
+numpy==1.24.3
+nvidia-cublas-cu12==12.1.3.1
+nvidia-cuda-cupti-cu12==12.1.105
+nvidia-cuda-nvrtc-cu12==12.1.105
+nvidia-cuda-runtime-cu12==12.1.105
+nvidia-cudnn-cu12==8.9.2.26
+nvidia-cufft-cu12==11.0.2.54
+nvidia-curand-cu12==10.3.2.106
+nvidia-cusolver-cu12==11.4.5.107
+nvidia-cusparse-cu12==12.1.0.106
+nvidia-ml-py==12.535.161
+nvidia-nccl-cu12==2.19.3
+nvidia-nvjitlink-cu12==12.6.77
+nvidia-nvtx-cu12==12.1.105
+nvitop==1.3.2
+omegaconf==2.3.0
+opencv-python==4.10.0.84
+ordered-set==4.1.0
+packaging==23.1
+pandas==2.2.2
+pandocfilters==1.5.1
+paramiko==3.4.0
+parso==0.8.4
+pathos==0.3.2
+pexpect==4.9.0
+pickleshare==0.7.5
+pillow==10.3.0
+pip-chill==1.0.3
+pip==24.1.2
+pipreqs==0.5.0
+platformdirs==4.2.2
+plotly==5.23.0
+pluggy==1.3.0
+ply==3.11
+pox==0.3.4
+ppft==1.7.6.8
+preshed==3.0.9
+prompt-toolkit==3.0.47
+propcache==0.2.0
+protobuf==3.20.3
+psutil==6.0.0
+ptyprocess==0.7.0
+pure-eval==0.2.3
+pyarrow==17.0.0
+pyasn1==0.6.0
+pybind11-global==2.13.1
+pybind11==2.13.1
+pycosat==0.6.4
+pycparser==2.21
+pydantic-core==2.20.1
+pydantic==2.8.2
+pyfunctional==1.5.0
+pygments==2.18.0
+pynacl==1.5.0
+pyopenssl==23.2.0
+pyparsing==3.1.2
+pyqt5-sip==12.12.2
+pyqt5==5.15.9
+pysocks==1.7.1
+python-dateutil==2.9.0
+pytz==2024.1
+pyyaml==6.0.2
+pyzmq==26.1.0
+referencing==0.35.1
+regex==2024.11.6
+requests==2.32.3
+retrying==1.3.4
+rich==13.7.1
+rpds-py==0.20.0
+rsa==4.7.2
+ruamel.yaml.clib==0.2.7
+ruamel.yaml==0.17.32
+s3fs==0.4.2
+s3transfer==0.10.2
+safetensors==0.4.5
+sagemaker-experiments==0.1.45
+sagemaker-pytorch-training==2.8.1
+sagemaker-training==4.8.1
+sagemaker==2.224.2
+schema==0.7.7
+scikit-learn==1.3.2
+scipy==1.14.0
+seaborn==0.13.2
+sentencepiece==0.2.0
+sentry-sdk==2.18.0
+setproctitle==1.3.3
+setuptools==72.1.0
+shap==0.46.0
+shellingham==1.5.4
+shtab==1.7.1
+sip==6.7.12
+six==1.16.0
+slicer==0.0.8
+smart-open==7.0.4
+smclarify==0.5
+smdebug-rulesconfig==1.0.1
+smdistributed-dataparallel==2.1.0
+smmap==5.0.1
+smprof==0.3.334
+soupsieve==2.6
+spacy-legacy==3.0.12
+spacy-loggers==1.0.5
+spacy==3.7.5
+srsly==2.4.8
+stack-data==0.6.2
+sympy==1.13.0
+tabulate==0.9.0
+tblib==3.0.0
+tenacity==9.0.0
+tensor-parallel==2.0.0
+termcolor==2.5.0
+thinc==8.2.5
+threadpoolctl==3.5.0
+tinycss2==1.4.0
+tokenizers==0.20.3
+toml==0.10.2
+tomli==2.0.1
+toolz==0.12.0
+torch==2.2.0
+torchaudio==2.2.0
+torchdata==0.7.0
+torchnet==0.0.4
+torchtext==0.16.0
+torchvision==0.17.0
+tornado==6.4.1
+tqdm==4.66.5
+traitlets==5.14.3
+transformer-engine==0.12.0+170797
+transformers==4.46.0
+triton==2.2.0
+trl==0.12.0
+typeguard==4.3.0
+typer-slim==0.12.3
+typer==0.12.3
+typing-extensions==4.12.2
+tyro==0.8.5
+tzdata==2024.1
+unicodedata2==15.1.0
+urllib3==1.26.19
+visdom==0.2.4
+wandb==0.16.3
+wasabi==1.1.2
+wcwidth==0.2.13
+weasel==0.4.1
+webencodings==0.5.1
+websocket-client==1.8.0
+werkzeug==3.0.3
+wheel==0.41.2
+wrapt==1.16.0
+xxhash==3.5.0
+xyzservices==2024.6.0
+yarg==0.1.9
+yarl==1.17.1
+zipp==3.19.2
+zope.event==5.0
+zope.interface==7.0.1
+zstandard==0.19.0

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-metadata.json ADDED Viewed

	@@ -0,0 +1,1069 @@

+{
+    "os": "Linux-5.10.226-214.879.amzn2.x86_64-x86_64-with-glibc2.31",
+    "python": "3.10.12",
+    "heartbeatAt": "2024-11-13T17:10:07.993791",
+    "startedAt": "2024-11-13T17:10:07.428221",
+    "docker": null,
+    "cuda": null,
+    "args": [
+        "--batch_size",
+        "64",
+        "--cache_dir",
+        "/opt/ml/data/input/.cache",
+        "--dataset",
+        "code-contests",
+        "--gradient_accumulation_steps",
+        "8",
+        "--logging_steps",
+        "5",
+        "--lr",
+        "1e-5",
+        "--max_seq_length",
+        "2048",
+        "--model_name",
+        "Qwen/Qwen2.5-Coder-7B-Instruct",
+        "--num_train_epochs",
+        "2",
+        "--output_dir",
+        "/opt/ml/model/",
+        "--push_to_hub",
+        "True",
+        "--run_name",
+        "sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048",
+        "--save_steps",
+        "100",
+        "--schedule",
+        "cosine",
+        "--wandb_project",
+        "sft-codecontests-1112",
+        "--weight_decay",
+        "0.0"
+    ],
+    "state": "running",
+    "program": "/opt/ml/code/qlearning_reasoning/training/sft.py",
+    "codePathLocal": "qlearning_reasoning/training/sft.py",
+    "codePath": "qlearning_reasoning/training/sft.py",
+    "git": {
+        "remote": "[email protected]:TRI-ML/reasoning-value-verifiers.git",
+        "commit": "cbfd05147f15c55be83f4996eebdb305c17f119d"
+    },
+    "email": null,
+    "root": "/opt/ml/code",
+    "host": "algo-1",
+    "username": "root",
+    "executable": "/opt/conda/bin/python3.10",
+    "cpu_count": 96,
+    "cpu_count_logical": 192,
+    "cpu_freq": {
+        "current": 2807.4830677083337,
+        "min": 0.0,
+        "max": 0.0
+    },
+    "cpu_freq_per_core": [
+        {
+            "current": 3476.342,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3247.882,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2904.031,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3109.433,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3599.377,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3103.902,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3160.704,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2903.061,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3151.516,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3220.914,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3113.9,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3599.288,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3149.924,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3195.68,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3273.352,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3152.916,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2940.821,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2997.447,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2722.682,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2960.205,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3014.718,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2865.342,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2643.892,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2626.179,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3181.377,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3271.231,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3187.187,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3199.812,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3207.165,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3251.62,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3597.089,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3222.446,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3597.008,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3199.923,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3328.709,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3189.821,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3176.968,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3170.487,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3186.086,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3216.688,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3594.347,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3039.479,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3486.888,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3343.804,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3238.757,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2966.737,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3348.466,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2907.859,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3002.238,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2217.1,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2241.607,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2684.27,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2719.247,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2783.971,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2773.016,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3086.799,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2611.966,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2540.393,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2541.301,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2543.134,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 1889.373,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2536.698,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 1960.209,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 1871.901,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2935.658,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2920.588,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3597.066,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3324.97,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3298.432,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3404.565,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2925.92,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3278.833,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2607.119,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 1884.144,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2516.733,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 1885.068,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 1881.651,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2500.279,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2519.44,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2497.886,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3376.996,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3262.597,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3258.462,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3243.917,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3263.253,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3596.819,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3251.877,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3453.493,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3597.538,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3252.456,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3235.472,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3258.914,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3221.932,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3223.056,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2916.257,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3221.381,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3249.041,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3158.094,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3117.532,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3180.319,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3597.35,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2902.289,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3193.614,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3132.908,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3221.533,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3082.135,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3036.898,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3596.595,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3185.956,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3178.002,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3186.383,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3138.284,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2890.053,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2878.155,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2943.671,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2924.089,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2461.058,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2961.225,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3097.346,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2638.607,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3267.369,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3301.989,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3255.895,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3305.783,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3320.452,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3278.446,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3598.093,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3266.814,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3596.43,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3270.648,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3505.783,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3297.048,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3264.728,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3224.761,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3342.449,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3342.148,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3597.921,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3251.183,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3533.37,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3446.582,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3261.516,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3254.535,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3261.428,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3262.921,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3276.045,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3266.835,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2751.168,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3167.713,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3180.263,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3203.948,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3234.562,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3486.665,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2789.289,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2859.707,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3143.341,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3089.871,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2266.761,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2745.206,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2832.943,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2820.125,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3202.152,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3127.913,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3598.345,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3220.73,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3025.305,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3391.839,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3119.74,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3231.315,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2396.33,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2423.797,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2527.72,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2467.572,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2425.179,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2028.21,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2503.85,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 2452.12,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3075.121,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3222.332,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3233.386,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3200.352,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3202.276,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3598.346,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3254.354,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3379.901,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3594.797,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3225.912,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3223.292,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3225.046,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3214.566,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3280.304,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3169.07,
+            "min": 0.0,
+            "max": 0.0
+        },
+        {
+            "current": 3225.192,
+            "min": 0.0,
+            "max": 0.0
+        }
+    ],
+    "disk": {
+        "/": {
+            "total": 119.94140625,
+            "used": 56.40110397338867
+        }
+    },
+    "gpu": "NVIDIA H100 80GB HBM3",
+    "gpu_count": 8,
+    "gpu_devices": [
+        {
+            "name": "NVIDIA H100 80GB HBM3",
+            "memory_total": 85520809984
+        },
+        {
+            "name": "NVIDIA H100 80GB HBM3",
+            "memory_total": 85520809984
+        },
+        {
+            "name": "NVIDIA H100 80GB HBM3",
+            "memory_total": 85520809984
+        },
+        {
+            "name": "NVIDIA H100 80GB HBM3",
+            "memory_total": 85520809984
+        },
+        {
+            "name": "NVIDIA H100 80GB HBM3",
+            "memory_total": 85520809984
+        },
+        {
+            "name": "NVIDIA H100 80GB HBM3",
+            "memory_total": 85520809984
+        },
+        {
+            "name": "NVIDIA H100 80GB HBM3",
+            "memory_total": 85520809984
+        },
+        {
+            "name": "NVIDIA H100 80GB HBM3",
+            "memory_total": 85520809984
+        }
+    ],
+    "memory": {
+        "total": 1999.9661331176758
+    }
+}

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"train/loss": 0.7172, "train/grad_norm": 0.341796875, "train/learning_rate": 3.0865828381745515e-06, "train/epoch": 1.22, "train/global_step": 15, "_timestamp": 1731518293.2375202, "_runtime": 485.8045001029968, "_step": 6, "eval/loss": 0.6777312159538269, "eval/runtime": 1.6459, "eval/samples_per_second": 61.97, "eval/steps_per_second": 1.215}

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/logs/debug-internal.log ADDED Viewed

	@@ -0,0 +1,373 @@

+2024-11-13 17:10:07,434 INFO    StreamThr :1939 [internal.py:wandb_internal():86] W&B internal server running at pid: 1939, started at: 2024-11-13 17:10:07.433254
+2024-11-13 17:10:07,435 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status
+2024-11-13 17:10:07,436 INFO    WriterThread:1939 [datastore.py:open_for_write():87] open: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/run-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1.wandb
+2024-11-13 17:10:07,437 DEBUG   SenderThread:1939 [sender.py:send():382] send: header
+2024-11-13 17:10:07,443 DEBUG   SenderThread:1939 [sender.py:send():382] send: run
+2024-11-13 17:10:07,751 INFO    SenderThread:1939 [dir_watcher.py:__init__():211] watching files in: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files
+2024-11-13 17:10:07,751 INFO    SenderThread:1939 [sender.py:_start_run_threads():1136] run started: kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1 with start time 1731517807.43302
+2024-11-13 17:10:07,759 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: check_version
+2024-11-13 17:10:07,760 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: check_version
+2024-11-13 17:10:07,839 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: run_start
+2024-11-13 17:10:07,929 DEBUG   HandlerThread:1939 [system_info.py:__init__():27] System info init
+2024-11-13 17:10:07,929 DEBUG   HandlerThread:1939 [system_info.py:__init__():42] System info init done
+2024-11-13 17:10:07,929 INFO    HandlerThread:1939 [system_monitor.py:start():194] Starting system monitor
+2024-11-13 17:10:07,929 INFO    SystemMonitor:1939 [system_monitor.py:_start():158] Starting system asset monitoring threads
+2024-11-13 17:10:07,930 INFO    HandlerThread:1939 [system_monitor.py:probe():214] Collecting system info
+2024-11-13 17:10:07,930 INFO    SystemMonitor:1939 [interfaces.py:start():190] Started cpu monitoring
+2024-11-13 17:10:07,931 INFO    SystemMonitor:1939 [interfaces.py:start():190] Started disk monitoring
+2024-11-13 17:10:07,932 INFO    SystemMonitor:1939 [interfaces.py:start():190] Started gpu monitoring
+2024-11-13 17:10:07,933 INFO    SystemMonitor:1939 [interfaces.py:start():190] Started memory monitoring
+2024-11-13 17:10:07,933 INFO    SystemMonitor:1939 [interfaces.py:start():190] Started network monitoring
+2024-11-13 17:10:07,993 DEBUG   HandlerThread:1939 [system_info.py:probe():151] Probing system
+2024-11-13 17:10:07,996 DEBUG   HandlerThread:1939 [system_info.py:_probe_git():136] Probing git
+2024-11-13 17:10:08,005 DEBUG   HandlerThread:1939 [system_info.py:_probe_git():144] Probing git done
+2024-11-13 17:10:08,005 DEBUG   HandlerThread:1939 [system_info.py:probe():199] Probing system done
+2024-11-13 17:10:08,005 DEBUG   HandlerThread:1939 [system_monitor.py:probe():223] {'os': 'Linux-5.10.226-214.879.amzn2.x86_64-x86_64-with-glibc2.31', 'python': '3.10.12', 'heartbeatAt': '2024-11-13T17:10:07.993791', 'startedAt': '2024-11-13T17:10:07.428221', 'docker': None, 'cuda': None, 'args': ('--batch_size', '64', '--cache_dir', '/opt/ml/data/input/.cache', '--dataset', 'code-contests', '--gradient_accumulation_steps', '8', '--logging_steps', '5', '--lr', '1e-5', '--max_seq_length', '2048', '--model_name', 'Qwen/Qwen2.5-Coder-7B-Instruct', '--num_train_epochs', '2', '--output_dir', '/opt/ml/model/', '--push_to_hub', 'True', '--run_name', 'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', '--save_steps', '100', '--schedule', 'cosine', '--wandb_project', 'sft-codecontests-1112', '--weight_decay', '0.0'), 'state': 'running', 'program': '/opt/ml/code/qlearning_reasoning/training/sft.py', 'codePathLocal': 'qlearning_reasoning/training/sft.py', 'codePath': 'qlearning_reasoning/training/sft.py', 'git': {'remote': '[email protected]:TRI-ML/reasoning-value-verifiers.git', 'commit': 'cbfd05147f15c55be83f4996eebdb305c17f119d'}, 'email': None, 'root': '/opt/ml/code', 'host': 'algo-1', 'username': 'root', 'executable': '/opt/conda/bin/python3.10', 'cpu_count': 96, 'cpu_count_logical': 192, 'cpu_freq': {'current': 2807.4830677083337, 'min': 0.0, 'max': 0.0}, 'cpu_freq_per_core': [{'current': 3476.342, 'min': 0.0, 'max': 0.0}, {'current': 3247.882, 'min': 0.0, 'max': 0.0}, {'current': 2904.031, 'min': 0.0, 'max': 0.0}, {'current': 3109.433, 'min': 0.0, 'max': 0.0}, {'current': 3599.377, 'min': 0.0, 'max': 0.0}, {'current': 3103.902, 'min': 0.0, 'max': 0.0}, {'current': 3160.704, 'min': 0.0, 'max': 0.0}, {'current': 2903.061, 'min': 0.0, 'max': 0.0}, {'current': 3151.516, 'min': 0.0, 'max': 0.0}, {'current': 3220.914, 'min': 0.0, 'max': 0.0}, {'current': 3113.9, 'min': 0.0, 'max': 0.0}, {'current': 3599.288, 
'min': 0.0, 'max': 0.0}, {'current': 3149.924, 'min': 0.0, 'max': 0.0}, {'current': 3195.68, 'min': 0.0, 'max': 0.0}, {'current': 3273.352, 'min': 0.0, 'max': 0.0}, {'current': 3152.916, 'min': 0.0, 'max': 0.0}, {'current': 2940.821, 'min': 0.0, 'max': 0.0}, {'current': 2997.447, 'min': 0.0, 'max': 0.0}, {'current': 2722.682, 'min': 0.0, 'max': 0.0}, {'current': 2960.205, 'min': 0.0, 'max': 0.0}, {'current': 3014.718, 'min': 0.0, 'max': 0.0}, {'current': 2865.342, 'min': 0.0, 'max': 0.0}, {'current': 2643.892, 'min': 0.0, 'max': 0.0}, {'current': 2626.179, 'min': 0.0, 'max': 0.0}, {'current': 3181.377, 'min': 0.0, 'max': 0.0}, {'current': 3271.231, 'min': 0.0, 'max': 0.0}, {'current': 3187.187, 'min': 0.0, 'max': 0.0}, {'current': 3199.812, 'min': 0.0, 'max': 0.0}, {'current': 3207.165, 'min': 0.0, 'max': 0.0}, {'current': 3251.62, 'min': 0.0, 'max': 0.0}, {'current': 3597.089, 'min': 0.0, 'max': 0.0}, {'current': 3222.446, 'min': 0.0, 'max': 0.0}, {'current': 3597.008, 'min': 0.0, 'max': 0.0}, {'current': 3199.923, 'min': 0.0, 'max': 0.0}, {'current': 3328.709, 'min': 0.0, 'max': 0.0}, {'current': 3189.821, 'min': 0.0, 'max': 0.0}, {'current': 3176.968, 'min': 0.0, 'max': 0.0}, {'current': 3170.487, 'min': 0.0, 'max': 0.0}, {'current': 3186.086, 'min': 0.0, 'max': 0.0}, {'current': 3216.688, 'min': 0.0, 'max': 0.0}, {'current': 3594.347, 'min': 0.0, 'max': 0.0}, {'current': 3039.479, 'min': 0.0, 'max': 0.0}, {'current': 3486.888, 'min': 0.0, 'max': 0.0}, {'current': 3343.804, 'min': 0.0, 'max': 0.0}, {'current': 3238.757, 'min': 0.0, 'max': 0.0}, {'current': 2966.737, 'min': 0.0, 'max': 0.0}, {'current': 3348.466, 'min': 0.0, 'max': 0.0}, {'current': 2907.859, 'min': 0.0, 'max': 0.0}, {'current': 3002.238, 'min': 0.0, 'max': 0.0}, {'current': 2217.1, 'min': 0.0, 'max': 0.0}, {'current': 2241.607, 'min': 0.0, 'max': 0.0}, {'current': 2684.27, 'min': 0.0, 'max': 0.0}, {'current': 2719.247, 'min': 0.0, 'max': 0.0}, {'current': 2783.971, 'min': 0.0, 'max': 0.0}, 
{'current': 2773.016, 'min': 0.0, 'max': 0.0}, {'current': 3086.799, 'min': 0.0, 'max': 0.0}, {'current': 2611.966, 'min': 0.0, 'max': 0.0}, {'current': 2540.393, 'min': 0.0, 'max': 0.0}, {'current': 2541.301, 'min': 0.0, 'max': 0.0}, {'current': 2543.134, 'min': 0.0, 'max': 0.0}, {'current': 1889.373, 'min': 0.0, 'max': 0.0}, {'current': 2536.698, 'min': 0.0, 'max': 0.0}, {'current': 1960.209, 'min': 0.0, 'max': 0.0}, {'current': 1871.901, 'min': 0.0, 'max': 0.0}, {'current': 2935.658, 'min': 0.0, 'max': 0.0}, {'current': 2920.588, 'min': 0.0, 'max': 0.0}, {'current': 3597.066, 'min': 0.0, 'max': 0.0}, {'current': 3324.97, 'min': 0.0, 'max': 0.0}, {'current': 3298.432, 'min': 0.0, 'max': 0.0}, {'current': 3404.565, 'min': 0.0, 'max': 0.0}, {'current': 2925.92, 'min': 0.0, 'max': 0.0}, {'current': 3278.833, 'min': 0.0, 'max': 0.0}, {'current': 2607.119, 'min': 0.0, 'max': 0.0}, {'current': 1884.144, 'min': 0.0, 'max': 0.0}, {'current': 2516.733, 'min': 0.0, 'max': 0.0}, {'current': 1885.068, 'min': 0.0, 'max': 0.0}, {'current': 1881.651, 'min': 0.0, 'max': 0.0}, {'current': 2500.279, 'min': 0.0, 'max': 0.0}, {'current': 2519.44, 'min': 0.0, 'max': 0.0}, {'current': 2497.886, 'min': 0.0, 'max': 0.0}, {'current': 3376.996, 'min': 0.0, 'max': 0.0}, {'current': 3262.597, 'min': 0.0, 'max': 0.0}, {'current': 3258.462, 'min': 0.0, 'max': 0.0}, {'current': 3243.917, 'min': 0.0, 'max': 0.0}, {'current': 3263.253, 'min': 0.0, 'max': 0.0}, {'current': 3596.819, 'min': 0.0, 'max': 0.0}, {'current': 3251.877, 'min': 0.0, 'max': 0.0}, {'current': 3453.493, 'min': 0.0, 'max': 0.0}, {'current': 3597.538, 'min': 0.0, 'max': 0.0}, {'current': 3252.456, 'min': 0.0, 'max': 0.0}, {'current': 3235.472, 'min': 0.0, 'max': 0.0}, {'current': 3258.914, 'min': 0.0, 'max': 0.0}, {'current': 3221.932, 'min': 0.0, 'max': 0.0}, {'current': 3223.056, 'min': 0.0, 'max': 0.0}, {'current': 2916.257, 'min': 0.0, 'max': 0.0}, {'current': 3221.381, 'min': 0.0, 'max': 0.0}, {'current': 3249.041, 'min': 
0.0, 'max': 0.0}, {'current': 3158.094, 'min': 0.0, 'max': 0.0}, {'current': 3117.532, 'min': 0.0, 'max': 0.0}, {'current': 3180.319, 'min': 0.0, 'max': 0.0}, {'current': 3597.35, 'min': 0.0, 'max': 0.0}, {'current': 2902.289, 'min': 0.0, 'max': 0.0}, {'current': 3193.614, 'min': 0.0, 'max': 0.0}, {'current': 3132.908, 'min': 0.0, 'max': 0.0}, {'current': 3221.533, 'min': 0.0, 'max': 0.0}, {'current': 3082.135, 'min': 0.0, 'max': 0.0}, {'current': 3036.898, 'min': 0.0, 'max': 0.0}, {'current': 3596.595, 'min': 0.0, 'max': 0.0}, {'current': 3185.956, 'min': 0.0, 'max': 0.0}, {'current': 3178.002, 'min': 0.0, 'max': 0.0}, {'current': 3186.383, 'min': 0.0, 'max': 0.0}, {'current': 3138.284, 'min': 0.0, 'max': 0.0}, {'current': 2890.053, 'min': 0.0, 'max': 0.0}, {'current': 2878.155, 'min': 0.0, 'max': 0.0}, {'current': 2943.671, 'min': 0.0, 'max': 0.0}, {'current': 2924.089, 'min': 0.0, 'max': 0.0}, {'current': 2461.058, 'min': 0.0, 'max': 0.0}, {'current': 2961.225, 'min': 0.0, 'max': 0.0}, {'current': 3097.346, 'min': 0.0, 'max': 0.0}, {'current': 2638.607, 'min': 0.0, 'max': 0.0}, {'current': 3267.369, 'min': 0.0, 'max': 0.0}, {'current': 3301.989, 'min': 0.0, 'max': 0.0}, {'current': 3255.895, 'min': 0.0, 'max': 0.0}, {'current': 3305.783, 'min': 0.0, 'max': 0.0}, {'current': 3320.452, 'min': 0.0, 'max': 0.0}, {'current': 3278.446, 'min': 0.0, 'max': 0.0}, {'current': 3598.093, 'min': 0.0, 'max': 0.0}, {'current': 3266.814, 'min': 0.0, 'max': 0.0}, {'current': 3596.43, 'min': 0.0, 'max': 0.0}, {'current': 3270.648, 'min': 0.0, 'max': 0.0}, {'current': 3505.783, 'min': 0.0, 'max': 0.0}, {'current': 3297.048, 'min': 0.0, 'max': 0.0}, {'current': 3264.728, 'min': 0.0, 'max': 0.0}, {'current': 3224.761, 'min': 0.0, 'max': 0.0}, {'current': 3342.449, 'min': 0.0, 'max': 0.0}, {'current': 3342.148, 'min': 0.0, 'max': 0.0}, {'current': 3597.921, 'min': 0.0, 'max': 0.0}, {'current': 3251.183, 'min': 0.0, 'max': 0.0}, {'current': 3533.37, 'min': 0.0, 'max': 0.0}, 
{'current': 3446.582, 'min': 0.0, 'max': 0.0}, {'current': 3261.516, 'min': 0.0, 'max': 0.0}, {'current': 3254.535, 'min': 0.0, 'max': 0.0}, {'current': 3261.428, 'min': 0.0, 'max': 0.0}, {'current': 3262.921, 'min': 0.0, 'max': 0.0}, {'current': 3276.045, 'min': 0.0, 'max': 0.0}, {'current': 3266.835, 'min': 0.0, 'max': 0.0}, {'current': 2751.168, 'min': 0.0, 'max': 0.0}, {'current': 3167.713, 'min': 0.0, 'max': 0.0}, {'current': 3180.263, 'min': 0.0, 'max': 0.0}, {'current': 3203.948, 'min': 0.0, 'max': 0.0}, {'current': 3234.562, 'min': 0.0, 'max': 0.0}, {'current': 3486.665, 'min': 0.0, 'max': 0.0}, {'current': 2789.289, 'min': 0.0, 'max': 0.0}, {'current': 2859.707, 'min': 0.0, 'max': 0.0}, {'current': 3143.341, 'min': 0.0, 'max': 0.0}, {'current': 3089.871, 'min': 0.0, 'max': 0.0}, {'current': 2266.761, 'min': 0.0, 'max': 0.0}, {'current': 2745.206, 'min': 0.0, 'max': 0.0}, {'current': 2832.943, 'min': 0.0, 'max': 0.0}, {'current': 2820.125, 'min': 0.0, 'max': 0.0}, {'current': 3202.152, 'min': 0.0, 'max': 0.0}, {'current': 3127.913, 'min': 0.0, 'max': 0.0}, {'current': 3598.345, 'min': 0.0, 'max': 0.0}, {'current': 3220.73, 'min': 0.0, 'max': 0.0}, {'current': 3025.305, 'min': 0.0, 'max': 0.0}, {'current': 3391.839, 'min': 0.0, 'max': 0.0}, {'current': 3119.74, 'min': 0.0, 'max': 0.0}, {'current': 3231.315, 'min': 0.0, 'max': 0.0}, {'current': 2396.33, 'min': 0.0, 'max': 0.0}, {'current': 2423.797, 'min': 0.0, 'max': 0.0}, {'current': 2527.72, 'min': 0.0, 'max': 0.0}, {'current': 2467.572, 'min': 0.0, 'max': 0.0}, {'current': 2425.179, 'min': 0.0, 'max': 0.0}, {'current': 2028.21, 'min': 0.0, 'max': 0.0}, {'current': 2503.85, 'min': 0.0, 'max': 0.0}, {'current': 2452.12, 'min': 0.0, 'max': 0.0}, {'current': 3075.121, 'min': 0.0, 'max': 0.0}, {'current': 3222.332, 'min': 0.0, 'max': 0.0}, {'current': 3233.386, 'min': 0.0, 'max': 0.0}, {'current': 3200.352, 'min': 0.0, 'max': 0.0}, {'current': 3202.276, 'min': 0.0, 'max': 0.0}, {'current': 3598.346, 'min': 
0.0, 'max': 0.0}, {'current': 3254.354, 'min': 0.0, 'max': 0.0}, {'current': 3379.901, 'min': 0.0, 'max': 0.0}, {'current': 3594.797, 'min': 0.0, 'max': 0.0}, {'current': 3225.912, 'min': 0.0, 'max': 0.0}, {'current': 3223.292, 'min': 0.0, 'max': 0.0}, {'current': 3225.046, 'min': 0.0, 'max': 0.0}, {'current': 3214.566, 'min': 0.0, 'max': 0.0}, {'current': 3280.304, 'min': 0.0, 'max': 0.0}, {'current': 3169.07, 'min': 0.0, 'max': 0.0}, {'current': 3225.192, 'min': 0.0, 'max': 0.0}], 'disk': {'/': {'total': 119.94140625, 'used': 56.40110397338867}}, 'gpu': 'NVIDIA H100 80GB HBM3', 'gpu_count': 8, 'gpu_devices': [{'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 80GB HBM3', 'memory_total': 85520809984}], 'memory': {'total': 1999.9661331176758}}
+2024-11-13 17:10:08,005 INFO    HandlerThread:1939 [system_monitor.py:probe():224] Finished collecting system info
+2024-11-13 17:10:08,005 INFO    HandlerThread:1939 [system_monitor.py:probe():227] Publishing system info
+2024-11-13 17:10:08,006 DEBUG   HandlerThread:1939 [system_info.py:_save_conda():208] Saving list of conda packages installed into the current environment
+2024-11-13 17:10:08,753 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/conda-environment.yaml
+2024-11-13 17:10:22,112 DEBUG   HandlerThread:1939 [system_info.py:_save_conda():220] Saving conda packages done
+2024-11-13 17:10:22,112 DEBUG   HandlerThread:1939 [system_info.py:_save_code():45] Saving code
+2024-11-13 17:10:22,117 DEBUG   HandlerThread:1939 [system_info.py:_save_code():66] Saving code done
+2024-11-13 17:10:22,117 DEBUG   HandlerThread:1939 [system_info.py:_save_patches():83] Saving git patches
+2024-11-13 17:10:22,755 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/conda-environment.yaml
+2024-11-13 17:10:22,755 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/code/qlearning_reasoning/training/sft.py
+2024-11-13 17:10:22,755 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/diff.patch
+2024-11-13 17:10:22,755 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/code/qlearning_reasoning/training
+2024-11-13 17:10:22,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/code/qlearning_reasoning
+2024-11-13 17:10:22,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/code
+2024-11-13 17:10:22,764 DEBUG   HandlerThread:1939 [system_info.py:_save_patches():125] Saving git patches done
+2024-11-13 17:10:22,766 INFO    HandlerThread:1939 [system_monitor.py:probe():229] Finished publishing system info
+2024-11-13 17:10:22,767 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:22,768 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: keepalive
+2024-11-13 17:10:22,768 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:22,768 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: keepalive
+2024-11-13 17:10:22,768 DEBUG   SenderThread:1939 [sender.py:send():382] send: files
+2024-11-13 17:10:22,769 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-metadata.json with policy now
+2024-11-13 17:10:22,769 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file code/qlearning_reasoning/training/sft.py with policy now
+2024-11-13 17:10:22,769 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file diff.patch with policy now
+2024-11-13 17:10:22,773 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: python_packages
+2024-11-13 17:10:22,773 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: python_packages
+2024-11-13 17:10:22,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:10:22,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:10:22,777 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:10:22,923 DEBUG   SenderThread:1939 [sender.py:send():382] send: telemetry
+2024-11-13 17:10:22,924 DEBUG   SenderThread:1939 [sender.py:send():382] send: config
+2024-11-13 17:10:22,924 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: telemetry
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:22,925 WARNING SenderThread:1939 [sender.py:send_metric():1354] Seen metric with glob (shouldn't happen)
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: telemetry
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: telemetry
+2024-11-13 17:10:22,925 DEBUG   SenderThread:1939 [sender.py:send():382] send: config
+2024-11-13 17:10:23,079 INFO    wandb-upload_1:1939 [upload_job.py:push():131] Uploaded file /tmp/tmp6y9zx1o1wandb/yx5qp0zp-code/qlearning_reasoning/training/sft.py
+2024-11-13 17:10:23,081 INFO    wandb-upload_0:1939 [upload_job.py:push():131] Uploaded file /tmp/tmp6y9zx1o1wandb/ohhel8zq-wandb-metadata.json
+2024-11-13 17:10:23,084 INFO    wandb-upload_2:1939 [upload_job.py:push():131] Uploaded file /tmp/tmp6y9zx1o1wandb/o4jbd2x2-diff.patch
+2024-11-13 17:10:23,755 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/diff.patch
+2024-11-13 17:10:23,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/requirements.txt
+2024-11-13 17:10:23,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:10:23,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-metadata.json
+2024-11-13 17:10:25,756 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:10:27,927 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:32,928 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:37,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:10:37,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:10:37,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:10:38,878 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:39,761 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/config.yaml
+2024-11-13 17:10:44,055 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:46,939 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:10:46,941 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:46,942 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:46,942 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:46,942 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:10:46,942 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:10:46,942 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:10:46,944 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:10:47,764 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:10:47,765 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_created():271] file/dir created: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:10:49,765 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:10:49,946 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:10:52,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:10:52,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:10:52,776 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:10:55,857 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:00,858 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:05,858 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:07,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:11:07,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:11:07,815 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:11:07,934 DEBUG   SystemMonitor:1939 [system_monitor.py:_start():172] Starting system metrics aggregation loop
+2024-11-13 17:11:07,937 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:11:11,483 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:11,774 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:11:11,774 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/config.yaml
+2024-11-13 17:11:16,645 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:21,646 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:22,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:11:22,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:11:22,777 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:11:26,930 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:31,930 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:35,784 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:11:37,312 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:37,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:11:37,774 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:11:37,777 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:11:37,941 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:11:42,943 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:47,944 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:52,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:11:52,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:11:52,815 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:11:53,939 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:11:57,792 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:11:59,512 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:04,513 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:07,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:12:07,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:12:07,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:12:07,944 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:12:09,946 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:14,946 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:18,339 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:12:18,341 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:12:18,341 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:12:18,341 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:12:18,801 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:12:19,801 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:12:19,952 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:12:19,954 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:12:19,955 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:12:19,955 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:19,955 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:12:19,956 DEBUG   SenderThread:1939 [sender.py:send():382] send: metric
+2024-11-13 17:12:19,957 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:12:19,957 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:12:19,957 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:12:20,802 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:12:21,802 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:12:22,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:12:22,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:12:22,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:12:25,846 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:30,847 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:35,847 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:37,774 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:12:37,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:12:37,815 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:12:37,946 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:12:40,948 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:43,811 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:12:46,900 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:47,812 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/config.yaml
+2024-11-13 17:12:52,087 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:12:52,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:12:52,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:12:52,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:12:57,926 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:02,927 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:07,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:13:07,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:13:07,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:13:07,820 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:13:07,949 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:13:07,950 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:12,951 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:17,952 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:22,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:13:22,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:13:22,815 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:13:23,932 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:29,529 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:29,829 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:13:34,530 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:37,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:13:37,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:13:37,776 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:13:37,952 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:13:39,954 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:44,955 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:49,955 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:13:51,838 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:13:52,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:13:52,775 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:13:52,777 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:13:55,936 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:00,937 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:05,938 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:07,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:14:07,776 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:14:07,819 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:14:07,954 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:14:10,956 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:12,899 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:14:12,900 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:14:12,901 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:14:12,902 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:14:13,847 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:14:13,847 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:14:14,513 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:14:14,514 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:14:14,514 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:14:14,516 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:14:14,847 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:14:15,848 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:14:16,517 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:21,517 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:22,776 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:14:22,777 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:14:22,777 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:14:26,902 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:31,903 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:37,269 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:37,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:14:37,776 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:14:37,778 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:14:37,857 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:14:37,957 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:14:42,959 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:47,960 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:52,775 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:14:52,776 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:14:52,819 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:14:53,918 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:58,973 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:14:59,866 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:15:03,974 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:07,776 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:15:07,776 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:15:07,778 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:15:07,960 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:15:09,962 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:14,963 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:19,963 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:24,560 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:15:24,560 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:15:24,760 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:15:25,654 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:30,654 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:35,655 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:37,965 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:15:38,559 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:15:38,559 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:15:38,599 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:15:40,718 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:45,718 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:50,719 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:15:53,891 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:15:55,441 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:15:55,632 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:15:55,633 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:15:55,738 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:01,306 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:06,307 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:07,966 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:16:08,649 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:16:08,805 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:16:08,805 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:16:09,899 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:11,308 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:11,900 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:13,900 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:15,902 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:16,682 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:17,903 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:19,904 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:21,862 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:21,905 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:23,906 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:16:26,484 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:16:27,824 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:28,965 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:16:28,965 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:16:33,084 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:37,969 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:16:38,971 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:41,636 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:16:42,736 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:16:42,737 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:16:44,879 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:49,879 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:54,880 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:16:56,904 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:16:56,908 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:16:56,908 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:16:57,922 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:17:00,014 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:05,015 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:07,971 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:17:08,907 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:17:10,425 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:10,425 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:17:10,425 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:17:15,586 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:20,587 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:23,906 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:17:25,425 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:17:25,425 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:17:26,585 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:29,937 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:17:32,376 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:37,377 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:37,975 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:17:38,907 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:17:40,426 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:17:40,426 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:17:42,574 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:47,575 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:51,945 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:17:52,901 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:17:53,908 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:17:55,425 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:17:55,426 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:17:58,561 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:03,562 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:07,977 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:18:08,908 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:18:08,979 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:10,424 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:18:10,425 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:18:11,623 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:18:11,625 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:18:11,625 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:18:11,626 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:18:11,953 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:18:12,953 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:18:13,237 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: partial_history
+2024-11-13 17:18:13,239 DEBUG   SenderThread:1939 [sender.py:send():382] send: history
+2024-11-13 17:18:13,240 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: summary_record
+2024-11-13 17:18:13,241 INFO    SenderThread:1939 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
+2024-11-13 17:18:13,954 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/wandb-summary.json
+2024-11-13 17:18:13,954 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:18:14,242 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:14,954 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:18:19,242 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:23,907 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:18:24,243 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:25,427 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:18:25,427 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:18:29,574 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:34,575 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:37,980 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:18:38,907 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:18:38,963 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:18:39,981 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:40,426 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:18:40,426 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:18:45,524 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:50,525 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:18:53,908 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:18:55,426 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:18:55,426 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:18:55,571 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:19:00,972 INFO    Thread-12 :1939 [dir_watcher.py:_on_file_modified():288] file/dir modified: /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/files/output.log
+2024-11-13 17:19:01,259 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:19:06,259 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report
+2024-11-13 17:19:07,982 DEBUG   SenderThread:1939 [sender.py:send():382] send: stats
+2024-11-13 17:19:08,908 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: internal_messages
+2024-11-13 17:19:10,426 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: stop_status
+2024-11-13 17:19:10,427 DEBUG   SenderThread:1939 [sender.py:send_request():409] send_request: stop_status
+2024-11-13 17:19:11,531 DEBUG   HandlerThread:1939 [handler.py:handle_request():146] handle_request: status_report

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/logs/debug.log ADDED Viewed

	@@ -0,0 +1,30 @@

+2024-11-13 17:10:07,429 INFO    MainThread:173 [wandb_setup.py:_flush():76] Current SDK version is 0.16.3
+2024-11-13 17:10:07,429 INFO    MainThread:173 [wandb_setup.py:_flush():76] Configure stats pid to 173
+2024-11-13 17:10:07,429 INFO    MainThread:173 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_setup.py:_flush():76] Loading settings from /opt/ml/code/wandb/settings
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_setup.py:_flush():76] Loading settings from environment variables: {'root_dir': '/opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', 'api_key': '***REDACTED***', 'project': 'sft-codecontests-1112', 'run_name': 'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048'}
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program_relpath': 'qlearning_reasoning/training/sft.py', 'program_abspath': '/opt/ml/code/qlearning_reasoning/training/sft.py', 'program': '/opt/ml/code/qlearning_reasoning/training/sft.py'}
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:_log_setup():526] Logging user logs to /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/logs/debug.log
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:_log_setup():527] Logging internal logs to /opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/logs/debug-internal.log
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:init():566] calling init triggers
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:init():573] wandb.init called with sweep_config: {}
+config: {'sagemaker_training_job_name': 'kushalarora-rvv-main-2024-11-13-16-43-09-915', 'batch_size': 64, 'cache_dir': '/opt/ml/data/input/.cache', 'dataset': 'code-contests', 'gradient_accumulation_steps': 8, 'logging_steps': 5, 'lr': '1e-5', 'max_seq_length': 2048, 'model_name': 'Qwen/Qwen2.5-Coder-7B-Instruct', 'num_train_epochs': 2, 'output_dir': '/opt/ml/output', 'push_to_hub': 'true', 'run_name': 'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', 'sagemaker_container_log_level': 20, 'sagemaker_instance_type': 'ml.p5.48xlarge', 'sagemaker_job_name': 'kushalarora-rvv-main-2024-11-13-16-43-09-915', 'sagemaker_program': 'sft.py', 'sagemaker_region': 'us-east-1', 'sagemaker_submit_directory': 's3://tri-ml-datasets/kushalarora-rvv-main-2024-11-13-16-43-09-915/source/sourcedir.tar.gz', 'sagemaker_torch_distributed_enabled': 'true', 'save_steps': 100, 'schedule': 'cosine', 'wandb_project': 'sft-codecontests-1112', 'weight_decay': 0.0, 'additional_framework_parameters': {'sagemaker_instance_type': 'ml.p5.48xlarge', 'sagemaker_torch_distributed_enabled': True}, 'channel_input_dirs': {}, 'current_host': 'algo-1', 'current_instance_group': 'homogeneousCluster', 'current_instance_group_hosts': ['algo-1'], 'current_instance_type': 'ml.p5.48xlarge', 'distribution_hosts': ['algo-1'], 'distribution_instance_groups': ['homogeneousCluster'], 'framework_module': 'sagemaker_pytorch_container.training:main', 'hosts': ['algo-1'], 'hyperparameters': {'batch_size': 64, 'cache_dir': '/opt/ml/data/input/.cache', 'dataset': 'code-contests', 'gradient_accumulation_steps': 8, 'logging_steps': 5, 'lr': '1e-5', 'max_seq_length': 2048, 'model_name': 'Qwen/Qwen2.5-Coder-7B-Instruct', 'num_train_epochs': 2, 'output_dir': '/opt/ml/model/', 'push_to_hub': True, 'run_name': 'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', 'save_steps': 100, 'schedule': 'cosine', 
'wandb_project': 'sft-codecontests-1112', 'weight_decay': 0.0}, 'input_config_dir': '/opt/ml/input/config', 'input_data_config': {}, 'input_dir': '/opt/ml/input', 'instance_groups': ['homogeneousCluster'], 'instance_groups_dict': {'homogeneousCluster': {'hosts': ['algo-1'], 'instance_group_name': 'homogeneousCluster', 'instance_type': 'ml.p5.48xlarge'}}, 'is_hetero': False, 'is_master': True, 'is_modelparallel_enabled': None, 'is_smddpmprun_installed': False, 'is_smddprun_installed': True, 'job_name': 'kushalarora-rvv-main-2024-11-13-16-43-09-915', 'log_level': 20, 'master_hostname': 'algo-1', 'model_dir': '/opt/ml/model', 'module_dir': 's3://tri-ml-datasets/kushalarora-rvv-main-2024-11-13-16-43-09-915/source/sourcedir.tar.gz', 'module_name': '/opt/ml/code/qlearning_reasoning/training/sft', 'network_interface_name': 'eth0', 'num_cpus': 192, 'num_gpus': 8, 'num_neurons': 0, 'output_data_dir': '/opt/ml/output/data', 'output_intermediate_dir': '/opt/ml/output/intermediate', 'resource_config': {'current_group_name': 'homogeneousCluster', 'current_host': 'algo-1', 'current_instance_type': 'ml.p5.48xlarge', 'hosts': ['algo-1'], 'instance_groups': [{'hosts': ['algo-1'], 'instance_group_name': 'homogeneousCluster', 'instance_type': 'ml.p5.48xlarge'}], 'network_interface_name': 'eth0'}, 'user_entry_point': '/opt/ml/code/qlearning_reasoning/training/sft.py'}
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:init():616] starting backend
+2024-11-13 17:10:07,430 INFO    MainThread:173 [wandb_init.py:init():620] setting up manager
+2024-11-13 17:10:07,431 INFO    MainThread:173 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
+2024-11-13 17:10:07,432 INFO    MainThread:173 [wandb_init.py:init():628] backend started and connected
+2024-11-13 17:10:07,435 INFO    MainThread:173 [wandb_init.py:init():720] updated telemetry
+2024-11-13 17:10:07,442 INFO    MainThread:173 [wandb_init.py:init():753] communicating run to backend with 90.0 second timeout
+2024-11-13 17:10:07,759 INFO    MainThread:173 [wandb_run.py:_on_init():2262] communicating current version
+2024-11-13 17:10:07,794 INFO    MainThread:173 [wandb_run.py:_on_init():2271] got version response upgrade_message: "wandb version 0.18.6 is available!  To upgrade, please run:\n $ pip install wandb --upgrade"
+2024-11-13 17:10:07,794 INFO    MainThread:173 [wandb_init.py:init():804] starting run threads in backend
+2024-11-13 17:10:22,774 INFO    MainThread:173 [wandb_run.py:_console_start():2241] atexit reg
+2024-11-13 17:10:22,775 INFO    MainThread:173 [wandb_run.py:_redirect():2096] redirect: wrap_raw
+2024-11-13 17:10:22,775 INFO    MainThread:173 [wandb_run.py:_redirect():2161] Wrapping output streams.
+2024-11-13 17:10:22,775 INFO    MainThread:173 [wandb_run.py:_redirect():2186] Redirects installed.
+2024-11-13 17:10:22,776 INFO    MainThread:173 [wandb_init.py:init():847] run started, returning control to user process
+2024-11-13 17:10:22,778 INFO    MainThread:173 [wandb_run.py:_config_callback():1343] config_cb None None {'vocab_size': 151671, 'max_position_embeddings': 32768, 'hidden_size': 3584, 'intermediate_size': 18944, 'num_hidden_layers': 28, 'num_attention_heads': 28, 'use_sliding_window': False, 'sliding_window': None, 'max_window_layers': 28, 'num_key_value_heads': 4, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000.0, 'rope_scaling': None, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'bfloat16', 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': False, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['Qwen2ForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'Qwen/Qwen2.5-Coder-7B-Instruct', 
'_attn_implementation_autoset': True, 'transformers_version': '4.46.0', 'model_type': 'qwen2', 'output_dir': '/opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 8, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 1e-05, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 2, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/opt/ml/model//sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048/runs/Nov13_17-09-37_algo-1', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'epoch', 'save_steps': 100, 'save_total_limit': None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': 5, 'dataloader_num_workers': 0, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': 
'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_acc-8_len-2048', 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': ['full_shard', 'auto_wrap'], 'fsdp_min_num_params': 0, 'fsdp_config': {'activation_checkpointing': False, 'auto_wrap_policy': 'TRANSFORMER_BASED_WRAP', 'backward_prefetch': 'BACKWARD_PRE', 'cpu_ram_efficient_loading': True, 'forward_prefetch': False, 'offload_params': False, 'sharding_strategy': 'FULL_SHARD', 'state_dict_type': 'FULL_STATE_DICT', 'sync_module_states': True, 'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': None, 'hub_model_id': 'sft-codecontests-qwen_ds-code-contests_model-Qwen2.5-Coder-7B-Instruct_sch-cosine_lr-1e-5_bs-64_', 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': {'use_reentrant': False}, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'evaluation_strategy': None, 'push_to_hub_model_id': None, 
'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'eval_use_gather_object': False, 'dataset_text_field': 'text', 'packing': False, 'max_seq_length': 2048, 'dataset_num_proc': None, 'dataset_batch_size': 64, 'model_init_kwargs': None, 'dataset_kwargs': {}, 'eval_packing': None, 'num_of_sequences': 1024, 'chars_per_token': '<CHARS_PER_TOKEN>', 'use_liger': False}
+2024-11-13 17:10:22,783 INFO    MainThread:173 [wandb_config.py:__setitem__():151] config set model/num_parameters = 951599936 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f533489f280>>
+2024-11-13 17:10:22,783 INFO    MainThread:173 [wandb_run.py:_config_callback():1343] config_cb model/num_parameters 951599936 None

wandb/run-20241113_171007-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1/run-kushalarora-rvv-main-2024-11-13-16-43-09-915-0exw0n-algo-1.wandb ADDED Viewed

Binary file (392 kB). View file