test / modules /dml /hijack /tomesd.py
bilegentile's picture
Upload folder using huggingface_hub
c19ca42 verified
raw
history blame contribute delete
879 Bytes
import torch
import tomesd
from typing import Type
from modules.dml.hijack.utils import catch_nan
def make_tome_block(block_class: Type[torch.nn.Module]) -> Type[torch.nn.Module]:
class ToMeBlock(block_class):
# Save for unpatching later
_parent = block_class
def _forward(self, x: torch.Tensor, context: torch.Tensor = None) -> torch.Tensor:
m_a, m_c, m_m, u_a, u_c, u_m = tomesd.patch.compute_merge(x, self._tome_info)
# This is where the meat of the computation happens
x = u_a(self.attn1(m_a(self.norm1(x)), context=context if self.disable_self_attn else None)) + x
x = catch_nan(lambda: (u_c(self.attn2(m_c(self.norm2(x)), context=context)) + x))
x = u_m(self.ff(m_m(self.norm3(x)))) + x
return x
return ToMeBlock
tomesd.patch.make_tome_block = make_tome_block