Spaces:
Running
on
Zero
Running
on
Zero
Upload sparse_elastic_mixin.py
Browse files
trellis/models/sparse_elastic_mixin.py
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
from contextlib import contextmanager
|
2 |
+
from typing import *
|
3 |
+
import math
|
4 |
+
from ..modules import sparse as sp
|
5 |
+
from ..utils.elastic_utils import ElasticModuleMixin
|
6 |
+
|
7 |
+
|
8 |
+
class SparseTransformerElasticMixin(ElasticModuleMixin):
|
9 |
+
def _get_input_size(self, x: sp.SparseTensor, *args, **kwargs):
|
10 |
+
return x.feats.shape[0]
|
11 |
+
|
12 |
+
@contextmanager
|
13 |
+
def with_mem_ratio(self, mem_ratio=1.0):
|
14 |
+
if mem_ratio == 1.0:
|
15 |
+
yield 1.0
|
16 |
+
return
|
17 |
+
num_blocks = len(self.blocks)
|
18 |
+
num_checkpoint_blocks = min(math.ceil((1 - mem_ratio) * num_blocks) + 1, num_blocks)
|
19 |
+
exact_mem_ratio = 1 - (num_checkpoint_blocks - 1) / num_blocks
|
20 |
+
for i in range(num_blocks):
|
21 |
+
self.blocks[i].use_checkpoint = i < num_checkpoint_blocks
|
22 |
+
yield exact_mem_ratio
|
23 |
+
for i in range(num_blocks):
|
24 |
+
self.blocks[i].use_checkpoint = False
|