Update app.py
Browse files
app.py
CHANGED
|
@@ -260,6 +260,7 @@ checkpoint_path = hf_hub_download(
|
|
| 260 |
local_dir=str(weights_dir),
|
| 261 |
local_dir_use_symlinks=False,
|
| 262 |
)
|
|
|
|
| 263 |
|
| 264 |
print("[Gemma] Setting up abliterated Gemma text encoder...")
|
| 265 |
MERGED_WEIGHTS = "/tmp/abliterated_gemma_merged.safetensors"
|
|
@@ -361,12 +362,14 @@ print(f"Realism LoRA: {realism_lora_path}")
|
|
| 361 |
print(f"Transition LoRA: {transition_lora_path}")
|
| 362 |
# ----------------------------------------------------------------
|
| 363 |
|
|
|
|
| 364 |
print(f"Checkpoint: {checkpoint_path}")
|
| 365 |
|
| 366 |
# Initialize pipeline WITH text encoder and optional audio support
|
| 367 |
# ---- Replace block (pipeline init) lines 275-281 ----
|
| 368 |
pipeline = LTX23DistilledA2VPipeline(
|
| 369 |
distilled_checkpoint_path=checkpoint_path,
|
|
|
|
| 370 |
gemma_root=gemma_root,
|
| 371 |
loras=[],
|
| 372 |
quantization=QuantizationPolicy.fp8_cast(), # keep FP8 quantization unchanged
|
|
@@ -522,6 +525,7 @@ _orig_video_decoder_factory = ledger.video_decoder
|
|
| 522 |
_orig_audio_encoder_factory = ledger.audio_encoder
|
| 523 |
_orig_audio_decoder_factory = ledger.audio_decoder
|
| 524 |
_orig_vocoder_factory = ledger.vocoder
|
|
|
|
| 525 |
_orig_text_encoder_factory = ledger.text_encoder
|
| 526 |
_orig_gemma_embeddings_factory = ledger.gemma_embeddings_processor
|
| 527 |
|
|
@@ -532,6 +536,7 @@ _video_decoder = _orig_video_decoder_factory()
|
|
| 532 |
_audio_encoder = _orig_audio_encoder_factory()
|
| 533 |
_audio_decoder = _orig_audio_decoder_factory()
|
| 534 |
_vocoder = _orig_vocoder_factory()
|
|
|
|
| 535 |
_text_encoder = _orig_text_encoder_factory()
|
| 536 |
_embeddings_processor = _orig_gemma_embeddings_factory()
|
| 537 |
|
|
@@ -543,6 +548,7 @@ ledger.video_decoder = lambda: _video_decoder
|
|
| 543 |
ledger.audio_encoder = lambda: _audio_encoder
|
| 544 |
ledger.audio_decoder = lambda: _audio_decoder
|
| 545 |
ledger.vocoder = lambda: _vocoder
|
|
|
|
| 546 |
ledger.text_encoder = lambda: _text_encoder
|
| 547 |
ledger.gemma_embeddings_processor = lambda: _embeddings_processor
|
| 548 |
|
|
|
|
| 260 |
local_dir=str(weights_dir),
|
| 261 |
local_dir_use_symlinks=False,
|
| 262 |
)
|
| 263 |
+
spatial_upsampler_path = hf_hub_download(repo_id=LTX_MODEL_REPO, filename="ltx-2.3-spatial-upscaler-x2-1.0.safetensors")
|
| 264 |
|
| 265 |
print("[Gemma] Setting up abliterated Gemma text encoder...")
|
| 266 |
MERGED_WEIGHTS = "/tmp/abliterated_gemma_merged.safetensors"
|
|
|
|
| 362 |
print(f"Transition LoRA: {transition_lora_path}")
|
| 363 |
# ----------------------------------------------------------------
|
| 364 |
|
| 365 |
+
print(f"Spatial upsampler: {spatial_upsampler_path}")
|
| 366 |
print(f"Checkpoint: {checkpoint_path}")
|
| 367 |
|
| 368 |
# Initialize pipeline WITH text encoder and optional audio support
|
| 369 |
# ---- Replace block (pipeline init) lines 275-281 ----
|
| 370 |
pipeline = LTX23DistilledA2VPipeline(
|
| 371 |
distilled_checkpoint_path=checkpoint_path,
|
| 372 |
+
spatial_upsampler_path=spatial_upsampler_path,
|
| 373 |
gemma_root=gemma_root,
|
| 374 |
loras=[],
|
| 375 |
quantization=QuantizationPolicy.fp8_cast(), # keep FP8 quantization unchanged
|
|
|
|
| 525 |
_orig_audio_encoder_factory = ledger.audio_encoder
|
| 526 |
_orig_audio_decoder_factory = ledger.audio_decoder
|
| 527 |
_orig_vocoder_factory = ledger.vocoder
|
| 528 |
+
_orig_spatial_upsampler_factory = ledger.spatial_upsampler
|
| 529 |
_orig_text_encoder_factory = ledger.text_encoder
|
| 530 |
_orig_gemma_embeddings_factory = ledger.gemma_embeddings_processor
|
| 531 |
|
|
|
|
| 536 |
_audio_encoder = _orig_audio_encoder_factory()
|
| 537 |
_audio_decoder = _orig_audio_decoder_factory()
|
| 538 |
_vocoder = _orig_vocoder_factory()
|
| 539 |
+
_spatial_upsampler = _orig_spatial_upsampler_factory()
|
| 540 |
_text_encoder = _orig_text_encoder_factory()
|
| 541 |
_embeddings_processor = _orig_gemma_embeddings_factory()
|
| 542 |
|
|
|
|
| 548 |
ledger.audio_encoder = lambda: _audio_encoder
|
| 549 |
ledger.audio_decoder = lambda: _audio_decoder
|
| 550 |
ledger.vocoder = lambda: _vocoder
|
| 551 |
+
ledger.spatial_upsampler = lambda: _spatial_upsampler
|
| 552 |
ledger.text_encoder = lambda: _text_encoder
|
| 553 |
ledger.gemma_embeddings_processor = lambda: _embeddings_processor
|
| 554 |
|