Update README.md
Browse files
README.md
CHANGED
@@ -6,41 +6,20 @@ base_model:
|
|
6 |
- Qwen/Qwen-Image
|
7 |
pipeline_tag: text-to-image
|
8 |
library_name: diffusers
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
9 |
---
|
10 |
# **gguf quantized version of qwen-image**
|
11 |
-
-
|
12 |
-
|
13 |
-
|
14 |
-
from diffusers import DiffusionPipeline, GGUFQuantizationConfig, QwenImageTransformer2DModel
|
15 |
|
16 |
-
|
17 |
-
transformer = QwenImageTransformer2DModel.from_single_file(
|
18 |
-
model_path,
|
19 |
-
quantization_config=GGUFQuantizationConfig(compute_dtype=torch.bfloat16),
|
20 |
-
torch_dtype=torch.bfloat16,
|
21 |
-
config="callgg/qi-decoder",
|
22 |
-
subfolder="transformer"
|
23 |
-
)
|
24 |
-
|
25 |
-
pipe = DiffusionPipeline.from_pretrained(
|
26 |
-
"callgg/qi-decoder",
|
27 |
-
transformer=transformer,
|
28 |
-
torch_dtype=torch.bfloat16,
|
29 |
-
)
|
30 |
-
pipe.enable_model_cpu_offload()
|
31 |
-
|
32 |
-
prompt = "a pig holding a sign that says hello world"
|
33 |
-
positive_magic = {"en": "Ultra HD, 4K, cinematic composition."}
|
34 |
-
negative_prompt = " "
|
35 |
-
|
36 |
-
image = pipe(
|
37 |
-
prompt=prompt + positive_magic["en"],
|
38 |
-
negative_prompt=negative_prompt,
|
39 |
-
height=1024,
|
40 |
-
width=1024,
|
41 |
-
num_inference_steps=24,
|
42 |
-
true_cfg_scale=2.5,
|
43 |
-
generator=torch.Generator().manual_seed(0)
|
44 |
-
).images[0]
|
45 |
-
image.save("output.png")
|
46 |
-
```
|
|
|
6 |
- Qwen/Qwen-Image
|
7 |
pipeline_tag: text-to-image
|
8 |
library_name: diffusers
|
9 |
+
widget:
|
10 |
+
- text: cute anime girl with massive fennec ears and a big fluffy fox tail with long wavy blonde hair between eyes and large blue eyes blonde colored eyelashes chubby wearing oversized clothes summer uniform long blue maxi skirt muddy clothes happy sitting on the side of the road in a run down dark gritty cyberpunk city with neon and a crumbling skyscraper in the rain at night while dipping her feet in a river of water she is holding a sign that says "ComfyUI is the best" written in cursive
|
11 |
+
output:
|
12 |
+
url: workflow-demo1.png
|
13 |
+
- text: cute anime girl with massive fennec ears and a big fluffy fox tail with long wavy blonde hair between eyes and large blue eyes blonde colored eyelashes chubby wearing oversized clothes summer uniform long blue maxi skirt muddy clothes happy sitting on the side of the road in a run down dark gritty cyberpunk city with neon and a crumbling skyscraper in the rain at night while dipping her feet in a river of water she is holding a sign that says "PIG is the best" written in cursive
|
14 |
+
output:
|
15 |
+
url: workflow-demo2.png
|
16 |
+
- text: cute anime girl with massive fennec ears and a big fluffy fox tail with long wavy blonde hair between eyes and large blue eyes blonde colored eyelashes chubby wearing oversized clothes summer uniform long blue maxi skirt muddy clothes happy sitting on the side of the road in a run down dark gritty cyberpunk city with neon and a crumbling skyscraper in the rain at night while dipping her feet in a river of water she is holding a sign that says "1+1=2 is it correct?" written in cursive
|
17 |
+
output:
|
18 |
+
url: workflow-demo3.png
|
19 |
---
|
20 |
# **gguf quantized version of qwen-image**
|
21 |
+
- drag **qwen-image** into `./ComfyUI/models/diffusion_models`
|
22 |
+
- drag **qwen2.5-vl-7b** into `./ComfyUI/models/text_encoders`
|
23 |
+
- drag **pig** into `./ComfyUI/models/vae`
|
|
|
24 |
|
25 |
+
<Gallery />
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|