siliconflow · lixiang007666 · Jun 30, 2024 · Jun 30, 2024 · Jul 29, 2024 · Jul 29, 2024
diff --git a/onediff_diffusers_extensions/examples/lightning/README.md b/onediff_diffusers_extensions/examples/lightning/README.md
@@ -0,0 +1,13 @@
+Quantize the SDXL-Lightning UNet by running the following command from the repository root:
+
+
+```bash
+python3 onediff_diffusers_extensions/tools/quantization/quantize-sd-fast.py \
+   --quantized_model ./sdxl_lightning_quant \
+   --conv_ssim_threshold 0.1 \
+   --linear_ssim_threshold 0.1 \
+   --conv_compute_density_threshold 900 \
+   --linear_compute_density_threshold 300 \
+   --save_as_float true \
+   --use_lightning 1
+```
diff --git a/onediff_diffusers_extensions/tools/quantization/quantize-sd-fast.py b/onediff_diffusers_extensions/tools/quantization/quantize-sd-fast.py
@@ -11,7 +11,10 @@
     StableDiffusionXLImg2ImgPipeline,
     StableDiffusionPipeline,
     StableDiffusionImg2ImgPipeline,
+    UNet2DConditionModel
 )
+from safetensors.torch import load_file
+from huggingface_hub import hf_hub_download
 
 from onediff.quantization import QuantPipeline
 
@@ -62,6 +65,9 @@
 )
 parser.add_argument("--seed", type=int, default=111)
 parser.add_argument("--cache_dir", type=str, default=None)
+parser.add_argument("--use_lightning", type=(lambda x: str(x).lower() in ["true", "1", "yes"]), default=False, help="Use the SDXL Lightning model if true")
+parser.add_argument("--lightning_ckpt", type=str, default="sdxl_lightning_4step_unet.safetensors",
+                    help="Checkpoint file name for the ByteDance SDXL-Lightning model")
 args = parser.parse_args()
 
 pipeline_cls = AutoPipelineForText2Image if args.input_image is None else AutoPipelineForImage2Image
@@ -87,6 +93,19 @@
             use_safetensors=True,
         )
 
+if args.use_lightning:
+    repo = "ByteDance/SDXL-Lightning"
+    ckpt = args.lightning_ckpt
+    unet = UNet2DConditionModel.from_config(args.model, subfolder="unet").to("cuda", torch.float16)
+    unet.load_state_dict(load_file(hf_hub_download(repo, ckpt), device="cuda"))
+    pipe = QuantPipeline.from_pretrained(
+        pipeline_cls,
+        args.model,
+        unet=unet,
+        torch_dtype=torch.float16,
+        variant=args.variant,
+        use_safetensors=True,
+    )
 else:
     pipe = QuantPipeline.from_pretrained(
         pipeline_cls,