[WIP] Needs refactoring.
This commit is contained in:
@@ -62,6 +62,7 @@ class Config:
|
||||
xattn_keep_sink: bool = False # Always keep first block (sink tokens)
|
||||
xattn_keep_recent: bool = False # Always keep recent diagonal blocks
|
||||
xattn_norm: float = 1.0 # Normalization factor for attention scores
|
||||
xattn_use_bsa: bool = True # Use Block Sparse Attention library (requires installation)
|
||||
|
||||
def __post_init__(self):
|
||||
assert os.path.isdir(self.model)
|
||||
|
||||
Reference in New Issue
Block a user