-
Notifications
You must be signed in to change notification settings - Fork 525
Description
Git commit
65891d7 (as reported in the debug log below)
Operating System & Version
Windows 11
GGML backends
CUDA
Command-line arguments used
sd-cli.exe -v --mmap --steps 5 --diffusion-model ..\models\diff\z_image_turbo-Q4_K.gguf --llm ..\models\llm\Qwen3-4B-Instruct-2507-Q8_0.gguf --vae ..\models\vae\pig_flux_vae_fp32-f16.gguf --diffusion-fa --rng cpu --sampler-rng cpu --clip-on-cpu --vae-tiling --cfg-scale 1.0 -H 512 -W 512 --output test.png -p "A paper dragon"
Steps to reproduce
Run sd-cli.exe with the command-line arguments listed above.
What you expected to happen
A .png image is generated (as it was with commit f957fa3).
What actually happened
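The program crashed: it exited back to the command prompt right after the "CLIP: Using CPU backend" log line, without printing any error message and without producing an image.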
Logs / error messages / stack trace
d:\bin\sdcpp\cuda>sd-cli.exe -v --mmap --steps 5 --diffusion-model ..\models\diff\z_image_turbo-Q4_K.gguf --llm ..\models\llm\Qwen3-4B-Instruct-2507-Q8_0.gguf --vae ..\models\vae\pig_flux_vae_fp32-f16.gguf --diffusion-fa --rng cpu --sampler-rng cpu --clip-on-cpu --vae-tiling --cfg-scale 1.0 -H 512 -W 512 --output test.png -p "A paper dragon"
[DEBUG] main.cpp:500 - version: stable-diffusion.cpp version unknown, commit 65891d7
[DEBUG] main.cpp:501 - System Info:
SSE3 = 1 | AVX = 1 | AVX2 = 1 | AVX512 = 1 | AVX512_VBMI = 0 | AVX512_VNNI = 0 | FMA = 1 | NEON = 0 | ARM_FMA = 0 | F16C = 1 | FP16_VA = 0 | WASM_SIMD = 0 | VSX = 0 |
[DEBUG] main.cpp:502 - SDCliParams {
mode: img_gen,
output_path: "test.png",
verbose: true,
color: false,
canny_preprocess: false,
convert_name: false,
preview_method: none,
preview_interval: 1,
preview_path: "preview.png",
preview_fps: 16,
taesd_preview: false,
preview_noisy: false
}
[DEBUG] main.cpp:503 - SDContextParams {
n_threads: 6,
model_path: "",
clip_l_path: "",
clip_g_path: "",
clip_vision_path: "",
t5xxl_path: "",
llm_path: "..\models\llm\Qwen3-4B-Instruct-2507-Q8_0.gguf",
llm_vision_path: "",
diffusion_model_path: "..\models\diff\z_image_turbo-Q4_K.gguf",
high_noise_diffusion_model_path: "",
vae_path: "..\models\vae\pig_flux_vae_fp32-f16.gguf",
taesd_path: "",
esrgan_path: "",
control_net_path: "",
embedding_dir: "",
embeddings: {
}
wtype: NONE,
tensor_type_rules: "",
lora_model_dir: ".",
photo_maker_path: "",
rng_type: cpu,
sampler_rng_type: cpu,
flow_shift: INF
offload_params_to_cpu: false,
enable_mmap: true,
control_net_cpu: false,
clip_on_cpu: true,
vae_on_cpu: false,
flash_attn: false,
diffusion_flash_attn: true,
diffusion_conv_direct: false,
vae_conv_direct: false,
circular: false,
circular_x: false,
circular_y: false,
chroma_use_dit_mask: true,
qwen_image_zero_cond_t: false,
chroma_use_t5_mask: false,
chroma_t5_mask_pad: 1,
prediction: NONE,
lora_apply_mode: auto,
vae_tiling_params: { 1, 0, 0, 0.5, 0, 0 },
force_sdxl_vae_conv_scale: false
}
[DEBUG] main.cpp:504 - SDGenerationParams {
loras: "{
}",
high_noise_loras: "{
}",
prompt: "A paper dragon",
negative_prompt: "",
clip_skip: -1,
width: 512,
height: 512,
batch_count: 1,
init_image_path: "",
end_image_path: "",
mask_image_path: "",
control_image_path: "",
ref_image_paths: [],
control_video_path: "",
auto_resize_ref_image: true,
increase_ref_index: false,
pm_id_images_dir: "",
pm_id_embed_path: "",
pm_style_strength: 20,
skip_layers: [7, 8, 9],
sample_params: (txt_cfg: 1.00, img_cfg: 1.00, distilled_guidance: 3.50, slg.layer_count: 3, slg.layer_start: 0.01, slg.layer_end: 0.20, slg.scale: 0.00, scheduler: NONE, sample_method: NONE, sample_steps: 5, eta: 0.00, shifted_timestep: 0),
high_noise_skip_layers: [7, 8, 9],
high_noise_sample_params: (txt_cfg: 7.00, img_cfg: 7.00, distilled_guidance: 3.50, slg.layer_count: 3, slg.layer_start: 0.01, slg.layer_end: 0.20, slg.scale: 0.00, scheduler: NONE, sample_method: NONE, sample_steps: 20, eta: 0.00, shifted_timestep: 0),
custom_sigmas: [],
cache_mode: "",
cache_option: "",
cache: disabled (threshold=1, start=0.15, end=0.95),
moe_boundary: 0.875,
video_frames: 1,
fps: 16,
vace_strength: 1,
strength: 0.75,
control_strength: 0.9,
seed: 42,
upscale_repeats: 1,
upscale_tile_size: 128,
}
[DEBUG] stable-diffusion.cpp:166 - Using CUDA backend
[INFO ] ggml_extend.hpp:78 - ggml_cuda_init: found 1 CUDA devices:
[INFO ] ggml_extend.hpp:78 - Device 0: NVIDIA GeForce GTX 1070, compute capability 6.1, VMM: yes
[INFO ] stable-diffusion.cpp:260 - loading diffusion model from '..\models\diff\z_image_turbo-Q4_K.gguf'
[INFO ] model.cpp:370 - load ..\models\diff\z_image_turbo-Q4_K.gguf using gguf format
[DEBUG] model.cpp:416 - init from '..\models\diff\z_image_turbo-Q4_K.gguf'
[INFO ] stable-diffusion.cpp:307 - loading llm from '..\models\llm\Qwen3-4B-Instruct-2507-Q8_0.gguf'
[INFO ] model.cpp:370 - load ..\models\llm\Qwen3-4B-Instruct-2507-Q8_0.gguf using gguf format
[DEBUG] model.cpp:416 - init from '..\models\llm\Qwen3-4B-Instruct-2507-Q8_0.gguf'
[INFO ] stable-diffusion.cpp:321 - loading vae from '..\models\vae\pig_flux_vae_fp32-f16.gguf'
[INFO ] model.cpp:370 - load ..\models\vae\pig_flux_vae_fp32-f16.gguf using gguf format
[DEBUG] model.cpp:416 - init from '..\models\vae\pig_flux_vae_fp32-f16.gguf'
[INFO ] stable-diffusion.cpp:337 - Version: Z-Image
[INFO ] stable-diffusion.cpp:365 - Weight type stat: f32: 570 | f16: 70 | q8_0: 275 | q4_K: 180
[INFO ] stable-diffusion.cpp:366 - Conditioner weight type stat: f32: 145 | q8_0: 253
[INFO ] stable-diffusion.cpp:367 - Diffusion model weight type stat: f32: 251 | q8_0: 22 | q4_K: 180
[INFO ] stable-diffusion.cpp:368 - VAE weight type stat: f32: 174 | f16: 70
[DEBUG] stable-diffusion.cpp:370 - ggml tensor size = 400 bytes
[INFO ] stable-diffusion.cpp:429 - CLIP: Using CPU backend
d:\bin\sdcpp\cuda>
Additional context / environment details
CPU: i7-8700; GPU: GTX 1070 (8 GB); RAM: 64 GB