Testing3

Runtime error

dagloop5 committed on Mar 18

Commit

f5c3128

verified ·

1 Parent(s): 6ab2dfe

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -338,19 +338,6 @@ if quant is not None:
     quant_kwargs["quantization"] = quant
 # --- END robust CUDA detection and quant selection ---
-# Only enable FP8 quantization if CUDA is present (FP8 uses Triton/CUDA kernels).
-# If QuantizationPolicy defines a no-op or 'none' option, use it; otherwise omit the arg.
-quant = None
-if use_cuda:
-    quant = QuantizationPolicy.fp8_cast()
-else:
-    # try to use a 'none' policy if available; otherwise we'll omit quantization
-    quant = getattr(QuantizationPolicy, "none", None)
-quant_kwargs = {}
-if quant is not None:
-    quant_kwargs["quantization"] = quant
 pipeline = LTX23DistilledA2VPipeline(
     distilled_checkpoint_path=checkpoint_path,
     spatial_upsampler_path=spatial_upsampler_path,
@@ -364,7 +351,7 @@ pipeline = LTX23DistilledA2VPipeline(
 print("Preloading models (GPU preloads only if CUDA is available)...")
 ledger = pipeline.model_ledger
-if torch.cuda.is_available():
     try:
         # Preload models (this will trigger GPU-side building; only do this when CUDA is present)
         _transformer = ledger.transformer()

     quant_kwargs["quantization"] = quant
 # --- END robust CUDA detection and quant selection ---
 pipeline = LTX23DistilledA2VPipeline(
     distilled_checkpoint_path=checkpoint_path,
     spatial_upsampler_path=spatial_upsampler_path,
 print("Preloading models (GPU preloads only if CUDA is available)...")
 ledger = pipeline.model_ledger
+if use_cuda:
     try:
         # Preload models (this will trigger GPU-side building; only do this when CUDA is present)
         _transformer = ledger.transformer()