KitsuVp
/

NeoLLM

@@ -279,14 +279,6 @@ class NeoLLMConfig(PretrainedConfig):
             values, such as ``32``, are valid memory-saving variants but are
             not the full paper-faithful default. Ignored when
             ``use_token_generator=False``.
-        generator_khronos_chunk_size (:obj:`int`, *optional*, defaults to 16):
-            Number of seed dimensions evaluated at once inside the Leviathan
-            KHRONOS tensor product.  This does not change the mathematical
-            function: it computes the same product by accumulating
-            ``Σ_d log|phi_d|`` over chunks.  The default ``16`` avoids
-            materializing the full ``[N, d_seed, krank]`` tensor during
-            torch.compile/AOTAutograd while preserving the article's separable
-            product.
         use_jtokm (:obj:`bool`, *optional*, defaults to ``False``):
             Enable the **Leviathan-JTok-M** token-indexed modulation module
             (Yang et al., 2026; fused with Leviathan geometry).
@@ -707,14 +699,13 @@ class NeoLLMConfig(PretrainedConfig):
         # ── Embedding input normalization ─────────────────────────────────
         use_embedding_input_norm=True,
         # ── Leviathan continuous token generator ──────────────────────────
-        use_token_generator=False,
         generator_d_seed=128,
         generator_num_modes=8,
         generator_num_knots=32,
         generator_spline_degree=2,
         generator_k=3,
         generator_krank=64,
-        generator_khronos_chunk_size=16,
         # ── Leviathan-JTok-M token-indexed modulation ─────────────────────
         use_jtokm=False,
         jtokm_num_experts=4,
@@ -1047,7 +1038,6 @@ class NeoLLMConfig(PretrainedConfig):
         self.generator_spline_degree       = generator_spline_degree
         self.generator_k                   = generator_k
         self.generator_krank               = generator_krank
-        self.generator_khronos_chunk_size  = generator_khronos_chunk_size
         # ── Leviathan-JTok-M ─────────────────────────────────────────────
         self.use_jtokm                     = use_jtokm

             values, such as ``32``, are valid memory-saving variants but are
             not the full paper-faithful default. Ignored when
             ``use_token_generator=False``.
         use_jtokm (:obj:`bool`, *optional*, defaults to ``False``):
             Enable the **Leviathan-JTok-M** token-indexed modulation module
             (Yang et al., 2026; fused with Leviathan geometry).
         # ── Embedding input normalization ─────────────────────────────────
         use_embedding_input_norm=True,
         # ── Leviathan continuous token generator ──────────────────────────
+        use_token_generator=True,
         generator_d_seed=128,
         generator_num_modes=8,
         generator_num_knots=32,
         generator_spline_degree=2,
         generator_k=3,
         generator_krank=64,
         # ── Leviathan-JTok-M token-indexed modulation ─────────────────────
         use_jtokm=False,
         jtokm_num_experts=4,
         self.generator_spline_degree       = generator_spline_degree
         self.generator_k                   = generator_k
         self.generator_krank               = generator_krank
         # ── Leviathan-JTok-M ─────────────────────────────────────────────
         self.use_jtokm                     = use_jtokm