File size: 583 Bytes
9a695c6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
# Quantization recipe: a single stage holding a single QuantizationModifier.
# NOTE(review): the key names look like an llm-compressor /
# compressed-tensors recipe — confirm against the consuming tool's schema.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # Modifier-level `targets` / `ignore` lists (ignore is explicitly empty).
      targets:
        - Linear
      ignore: []
      config_groups:
        # The only config group defined; its `targets` list names
        # LlamaAttention.
        attention:
          targets:
            - LlamaAttention
          format: null
          # Only `input_activations` carries settings in this group; `weights`
          # and `output_activations` are explicitly null.
          weights: null
          output_activations: null
          input_activations:
            # Numeric format: 8 bits, float type, symmetric.
            num_bits: 8
            type: float
            symmetric: true
            # Non-dynamic, using the `static_minmax` observer with no extra
            # observer arguments.
            dynamic: false
            observer: static_minmax
            observer_kwargs: {}
            # Granularity: `attn_head` strategy; the group/block/actorder
            # options are all left null.
            strategy: attn_head
            group_size: null
            block_structure: null
            actorder: null