klemenk committed on
Commit
7b60bd0
·
verified ·
1 Parent(s): 2cad72d

Copy configuration_auristream.py from TuKoResearch/AuriStream1B_40Pred_librilight_500k

Browse files
Files changed (1) hide show
  1. configuration_auristream.py +28 -0
configuration_auristream.py ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from transformers import PretrainedConfig
2
+
3
class AuriStreamConfig(PretrainedConfig):
    """Hyperparameter container for AuriStream models.

    Every named constructor argument is stored unchanged as an instance
    attribute of the same name; any additional keyword arguments are
    forwarded to ``PretrainedConfig.__init__``.

    Args:
        n_layer: Stored as ``self.n_layer``. Defaults to 48.
            (Presumably the number of transformer layers -- confirm
            against the model implementation.)
        n_head: Stored as ``self.n_head``. Defaults to 16.
            (Presumably the number of attention heads -- confirm.)
        n_embd: Stored as ``self.n_embd``. Defaults to 1280.
            (Presumably the embedding width -- confirm.)
        vocab_size: Stored as ``self.vocab_size``. Defaults to 8192.
        dropout: Stored as ``self.dropout``. Defaults to 0.0.
        bias: Stored as ``self.bias``. Defaults to False.
        use_rope: Stored as ``self.use_rope``. Defaults to False.
            (Presumably toggles rotary position embeddings -- confirm.)
        n_pred_steps: Stored as ``self.n_pred_steps``. Defaults to 20.
            (Presumably the number of prediction steps -- confirm.)
        seq_len: Stored as ``self.seq_len``. Defaults to 4096.
        **kwargs: Passed through untouched to the parent constructor.
    """

    # Identifier string for this configuration class.
    model_type = "AuriStream.AuriStream"

    def __init__(
        self,
        n_layer: int = 48,
        n_head: int = 16,
        n_embd: int = 1280,
        vocab_size: int = 8192,
        dropout: float = 0.0,
        bias: bool = False,
        use_rope: bool = False,
        n_pred_steps: int = 20,
        seq_len: int = 4096,
        **kwargs,
    ) -> None:
        # Model-specific fields are recorded first, in declaration order.
        self.n_layer = n_layer
        self.n_head = n_head
        self.n_embd = n_embd
        self.vocab_size = vocab_size
        self.dropout = dropout
        self.bias = bias
        self.use_rope = use_rope
        self.n_pred_steps = n_pred_steps
        self.seq_len = seq_len

        # The parent constructor runs last and receives only the
        # leftover keyword arguments.
        super().__init__(**kwargs)