language-translation / config.json
Avanthika's picture
Upload config.json
9ce941d
{
"Transformer": {
"encoder": {
"sentence_embedding": {
"embedding": {
"num_embeddings": 71,
"embedding_dim": 512
},
"position_encoder": {},
"dropout": 0.1
},
"layers": [
{
"attention": {
"qkv_layer": {
"in_features": 512,
"out_features": 1536,
"bias": true
},
"linear_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
}
},
"norm1": {},
"dropout1": 0.1,
"ffn": {
"linear1": {
"in_features": 512,
"out_features": 2048,
"bias": true
},
"linear2": {
"in_features": 2048,
"out_features": 512,
"bias": true
}
},
"norm2": {},
"dropout2": 0.1
},
{
"attention": {
"qkv_layer": {
"in_features": 512,
"out_features": 1536,
"bias": true
},
"linear_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
}
},
"norm1": {},
"dropout1": 0.1,
"ffn": {
"linear1": {
"in_features": 512,
"out_features": 2048,
"bias": true
},
"linear2": {
"in_features": 2048,
"out_features": 512,
"bias": true
}
},
"norm2": {},
"dropout2": 0.1
},
{
"attention": {
"qkv_layer": {
"in_features": 512,
"out_features": 1536,
"bias": true
},
"linear_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
}
},
"norm1": {},
"dropout1": 0.1,
"ffn": {
"linear1": {
"in_features": 512,
"out_features": 2048,
"bias": true
},
"linear2": {
"in_features": 2048,
"out_features": 512,
"bias": true
}
},
"norm2": {},
"dropout2": 0.1
}
]
},
"decoder": {
"sentence_embedding": {
"embedding": {
"num_embeddings": 125,
"embedding_dim": 512
},
"position_encoder": {},
"dropout": 0.1
},
"layers": [
{
"self_attention": {
"qkv_layer": {
"in_features": 512,
"out_features": 1536,
"bias": true
},
"linear_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
}
},
"layer_norm1": {},
"dropout1": 0.1,
"encoder_decoder_attention": {
"kv_layer": {
"in_features": 512,
"out_features": 1024,
"bias": true
},
"q_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
},
"linear_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
}
},
"layer_norm2": {},
"dropout2": 0.1,
"ffn": {
"linear1": {
"in_features": 512,
"out_features": 2048,
"bias": true
},
"linear2": {
"in_features": 2048,
"out_features": 512,
"bias": true
}
},
"layer_norm3": {},
"dropout3": 0.1
},
{
"self_attention": {
"qkv_layer": {
"in_features": 512,
"out_features": 1536,
"bias": true
},
"linear_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
}
},
"layer_norm1": {},
"dropout1": 0.1,
"encoder_decoder_attention": {
"kv_layer": {
"in_features": 512,
"out_features": 1024,
"bias": true
},
"q_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
},
"linear_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
}
},
"layer_norm2": {},
"dropout2": 0.1,
"ffn": {
"linear1": {
"in_features": 512,
"out_features": 2048,
"bias": true
},
"linear2": {
"in_features": 2048,
"out_features": 512,
"bias": true
}
},
"layer_norm3": {},
"dropout3": 0.1
},
{
"self_attention": {
"qkv_layer": {
"in_features": 512,
"out_features": 1536,
"bias": true
},
"linear_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
}
},
"layer_norm1": {},
"dropout1": 0.1,
"encoder_decoder_attention": {
"kv_layer": {
"in_features": 512,
"out_features": 1024,
"bias": true
},
"q_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
},
"linear_layer": {
"in_features": 512,
"out_features": 512,
"bias": true
}
},
"layer_norm2": {},
"dropout2": 0.1,
"ffn": {
"linear1": {
"in_features": 512,
"out_features": 2048,
"bias": true
},
"linear2": {
"in_features": 2048,
"out_features": 512,
"bias": true
}
},
"layer_norm3": {},
"dropout3": 0.1
}
]
},
"linear": {
"in_features": 512,
"out_features": 125,
"bias": true
}
}
}