Jaleah-AI / config.json
teckmill's picture
Upload 3 files
0957be2 verified
{
  "model_name": "ai-coder-v1",
  "model_type": "llama",
  "vocab_size": 10000,
  "n_positions": 2048,
  "n_ctx": 2048,
  "n_embd": 512,
  "n_layer": 6,
  "n_head": 8,
  "n_kv_head": 4,
  "rotary_dim": 64,
  "activation_function": "swiglu",
  "layer_norm_epsilon": 1e-05,
  "initializer_range": 0.02,
  "use_cache": true,
  "rope_scaling": {
    "type": "dynamic",
    "factor": 2.0
  },
  "sliding_window": 1024,
  "attention_config": {
    "type": "multi_query",
    "head_dim": 64,
    "kv_heads": 4,
    "sliding_window": 1024,
    "attention_dropout": 0.1
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "tokenizer_class": "CodeTokenizer",
  "tie_word_embeddings": true,
  "torch_dtype": "bfloat16",
  "transformers_version": "4.37.0",
  "flash_attention": false,
  "gradient_checkpointing": false,
  "use_memory_efficient_attention": false,
  "parallel_attention": false,
  "learning_config": {
    "online_learning": {
      "enabled": false,
      "learning_rate": 0.0001,
      "batch_size": 16,
      "max_steps": 100,
      "warmup_steps": 10
    },
    "meta_learning": {
      "enabled": false,
      "inner_learning_rate": 0.001,
      "outer_learning_rate": 0.0001,
      "num_inner_steps": 3,
      "num_outer_steps": 10
    },
    "active_learning": {
      "enabled": true,
      "uncertainty_threshold": 0.8,
      "max_queries_per_session": 5,
      "min_confidence_score": 0.6
    },
    "knowledge_distillation": {
      "enabled": true,
      "temperature": 2.0,
      "alpha": 0.5,
      "teacher_models": [
        "gpt-4",
        "claude-3"
      ]
    },
    "feedback_learning": {
      "enabled": true,
      "feedback_buffer_size": 1000,
      "min_feedback_samples": 50,
      "update_interval": 100
    },
    "optimization": {
      "optimizer": "adamw",
      "weight_decay": 0.01,
      "learning_rate_scheduler": "cosine",
      "warmup_ratio": 0.1,
      "gradient_clip_val": 1.0
    }
  },
  "advanced_features": {
    "code_completion": true,
    "type_inference": true,
    "semantic_analysis": true,
    "refactoring": true,
    "bug_detection": true,
    "security_analysis": true,
    "performance_optimization": true,
    "style_checking": true,
    "documentation_generation": true,
    "test_generation": true,
    "multi_language_support": true,
    "framework_detection": true
  }
}