less noisy
Browse files
model.py
CHANGED
@@ -410,9 +410,9 @@ def disable_dropout(model: torch.nn.Module):
|
|
410 |
dropout_modules = [m for m in model.modules() if isinstance(m, torch.nn.Dropout)]
|
411 |
for m in dropout_modules:
|
412 |
m.p = 0.0
|
413 |
-
print0(
|
414 |
-
f"Disabled {len(dropout_modules)} dropout modules from model type {type(model)}"
|
415 |
-
)
|
416 |
|
417 |
|
418 |
def disable_causality(model: torch.nn.Module):
|
@@ -793,7 +793,7 @@ class DatasetConditionedBiencoder(transformers.PreTrainedModel, ContextualModelM
|
|
793 |
if hasattr(module, "rotary_emb_dim"):
|
794 |
module.rotary_start_pos = rotary_start_pos
|
795 |
rotary_disabled += 1
|
796 |
-
print0(f"modified {rotary_disabled} rotary modules – set rotary_start_pos to {rotary_start_pos}")
|
797 |
|
798 |
def forward(
|
799 |
self,
|
|
|
410 |
dropout_modules = [m for m in model.modules() if isinstance(m, torch.nn.Dropout)]
|
411 |
for m in dropout_modules:
|
412 |
m.p = 0.0
|
413 |
+
#print0(
|
414 |
+
# f"Disabled {len(dropout_modules)} dropout modules from model type {type(model)}"
|
415 |
+
#)
|
416 |
|
417 |
|
418 |
def disable_causality(model: torch.nn.Module):
|
|
|
793 |
if hasattr(module, "rotary_emb_dim"):
|
794 |
module.rotary_start_pos = rotary_start_pos
|
795 |
rotary_disabled += 1
|
796 |
+
# print0(f"modified {rotary_disabled} rotary modules – set rotary_start_pos to {rotary_start_pos}")
|
797 |
|
798 |
def forward(
|
799 |
self,
|