File size: 385 Bytes
550eb56 |
1 2 3 4 5 6 7 8 9 10 11 |
"""
DeepSeek Multi-Latent Attention Implementation
Copyright (c) 2025
Implementation of the Multi-Latent Attention mechanism from the DeepSeek-V2 paper.
"""
# Re-export the public names from the package-relative ``mla`` module so they
# can be imported directly from the package itself.
from .mla import (
    MultiLatentAttention,
    apply_rotary_emb,
    precompute_freqs_cis,
    reshape_for_broadcast,
)

# Version string of this package.
__version__ = "0.1.0"

# Names exposed by a star-import of this package.
__all__ = [
    "MultiLatentAttention",
    "precompute_freqs_cis",
    "reshape_for_broadcast",
    "apply_rotary_emb",
]