{
  "model_name": "ai-coder-v1",
  "model_type": "llama",
  "vocab_size": 10000,
  "n_positions": 2048,
  "n_ctx": 2048,
  "n_embd": 512,
  "n_layer": 6,
  "n_head": 8,
  "n_kv_head": 4,
  "rotary_dim": 64,
  "activation_function": "swiglu",
  "layer_norm_epsilon": 1e-05,
  "initializer_range": 0.02,
  "use_cache": true,
  "rope_scaling": {
    "type": "dynamic",
    "factor": 2.0
  },
  "sliding_window": 1024,
  "attention_config": {
    "type": "multi_query",
    "head_dim": 64,
    "kv_heads": 4,
    "sliding_window": 1024,
    "attention_dropout": 0.1
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "tokenizer_class": "CodeTokenizer",
  "tie_word_embeddings": true,
  "torch_dtype": "bfloat16",
  "transformers_version": "4.37.0",
  "flash_attention": false,
  "gradient_checkpointing": false,
  "use_memory_efficient_attention": false,
  "parallel_attention": false,
  "learning_config": {
    "online_learning": {
      "enabled": false,
      "learning_rate": 0.0001,
      "batch_size": 16,
      "max_steps": 100,
      "warmup_steps": 10
    },
    "meta_learning": {
      "enabled": false,
      "inner_learning_rate": 0.001,
      "outer_learning_rate": 0.0001,
      "num_inner_steps": 3,
      "num_outer_steps": 10
    },
    "active_learning": {
      "enabled": true,
      "uncertainty_threshold": 0.8,
      "max_queries_per_session": 5,
      "min_confidence_score": 0.6
    },
    "knowledge_distillation": {
      "enabled": true,
      "temperature": 2.0,
      "alpha": 0.5,
      "teacher_models": [
        "gpt-4",
        "claude-3"
      ]
    },
    "feedback_learning": {
      "enabled": true,
      "feedback_buffer_size": 1000,
      "min_feedback_samples": 50,
      "update_interval": 100
    },
    "optimization": {
      "optimizer": "adamw",
      "weight_decay": 0.01,
      "learning_rate_scheduler": "cosine",
      "warmup_ratio": 0.1,
      "gradient_clip_val": 1.0
    }
  },
  "advanced_features": {
    "code_completion": true,
    "type_inference": true,
    "semantic_analysis": true,
    "refactoring": true,
    "bug_detection": true,
    "security_analysis": true,
    "performance_optimization": true,
    "style_checking": true,
    "documentation_generation": true,
    "test_generation": true,
    "multi_language_support": true,
    "framework_detection": true
  }
}
|