Update app.py
Browse files
app.py
CHANGED
|
@@ -329,7 +329,7 @@ pipeline = LTX23DistilledA2VPipeline(
|
|
| 329 |
spatial_upsampler_path=spatial_upsampler_path,
|
| 330 |
gemma_root=gemma_root,
|
| 331 |
loras=[],
|
| 332 |
-
quantization=
|
| 333 |
)
|
| 334 |
# ----------------------------------------------------------------
|
| 335 |
|
|
@@ -428,7 +428,7 @@ def prepare_lora_cache(
|
|
| 428 |
spatial_upsampler_path=str(spatial_upsampler_path),
|
| 429 |
gemma_root_path=str(gemma_root),
|
| 430 |
loras=tuple(loras_for_builder),
|
| 431 |
-
quantization=
|
| 432 |
)
|
| 433 |
new_transformer_cpu = tmp_ledger.transformer()
|
| 434 |
|
|
|
|
| 329 |
spatial_upsampler_path=spatial_upsampler_path,
|
| 330 |
gemma_root=gemma_root,
|
| 331 |
loras=[],
|
| 332 |
+
quantization=QuantizationPolicy.fp8_cast(),
|
| 333 |
)
|
| 334 |
# ----------------------------------------------------------------
|
| 335 |
|
|
|
|
| 428 |
spatial_upsampler_path=str(spatial_upsampler_path),
|
| 429 |
gemma_root_path=str(gemma_root),
|
| 430 |
loras=tuple(loras_for_builder),
|
| 431 |
+
quantization=QuantizationPolicy.fp8_cast(),
|
| 432 |
)
|
| 433 |
new_transformer_cpu = tmp_ledger.transformer()
|
| 434 |
|