Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
34 commits
Select commit Hold shift + click to select a range
661021a
trt dynamic scale
ryanontheinside Aug 8, 2025
552cd0f
move trt attn to diffusers ipadapter
ryanontheinside Aug 8, 2025
ced21f3
support weight types
ryanontheinside Aug 8, 2025
1da29d9
add ipadapter hooks
ryanontheinside Aug 8, 2025
1433e71
add controlnet module
ryanontheinside Aug 8, 2025
e650cae
cleanup pipeline
ryanontheinside Aug 8, 2025
548c120
integration with fallback shims
ryanontheinside Aug 9, 2025
e47f1d9
controlnet updates and ordering
ryanontheinside Aug 9, 2025
c4938d6
update lock
ryanontheinside Aug 9, 2025
b6a4143
deprecate config methods
ryanontheinside Aug 9, 2025
373bddb
fix feedback
ryanontheinside Aug 9, 2025
c8bb03f
remove IPAdapterPipeline reference trt
ryanontheinside Aug 9, 2025
b20960e
cleanup deprecations
ryanontheinside Aug 9, 2025
5ff7c8e
sdxl controlnet fix
ryanontheinside Aug 9, 2025
b2cb3b6
IPA: remove scale from engine path, pre install attn
ryanontheinside Aug 9, 2025
1149d7e
fix controlnet compile and runtime trt
ryanontheinside Aug 9, 2025
39a68a9
remove legacy code
ryanontheinside Aug 9, 2025
7c28af1
ipadapter->hook, remove shims
ryanontheinside Aug 9, 2025
de9f725
remove shim use from demos
ryanontheinside Aug 9, 2025
d45bf3e
consolidate demos and configs
ryanontheinside Aug 9, 2025
17a883c
ensure preprocessing parallelism
ryanontheinside Aug 9, 2025
0937ae7
remove legacy update methods
ryanontheinside Aug 9, 2025
fcac228
unified getter for stream state
ryanontheinside Aug 9, 2025
924f2c9
fix resolution endpoint
ryanontheinside Aug 9, 2025
4d4ea68
cache pipelining check
ryanontheinside Aug 12, 2025
06fd221
todo
ryanontheinside Aug 12, 2025
b0fcdd2
cache controlimage per frame
ryanontheinside Aug 12, 2025
9d8abf0
reuse prepro orchestrator
ryanontheinside Aug 12, 2025
0462187
cleaner controlnet caching
ryanontheinside Aug 13, 2025
5804973
blurry output
ryanontheinside Aug 10, 2025
b497bd7
working sans controlnet
ryanontheinside Aug 11, 2025
f3514f8
ui fix
ryanontheinside Aug 11, 2025
93f71cc
remove t2i cache
ryanontheinside Aug 11, 2025
5049faa
t2i update from demo
ryanontheinside Aug 11, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
54 changes: 0 additions & 54 deletions configs/prompt_blending_demo.yaml.example

This file was deleted.

45 changes: 0 additions & 45 deletions configs/sd15_canny_depth.yaml.example

This file was deleted.

42 changes: 0 additions & 42 deletions configs/sd15_depth_trt_example.yaml.example

This file was deleted.

74 changes: 74 additions & 0 deletions configs/sd15_multicontrol.yaml.example
Original file line number Diff line number Diff line change
@@ -0,0 +1,74 @@
# StreamDiffusion SD1.5 Multi-ControlNet + IPAdapter Configuration
# Demonstrates: TensorRT depth processing, tile with feedback, and IPAdapter integration
#
# Layout: scalar pipeline settings live at the top level; `prompt_blending`,
# `ipadapters`, and `controlnets` are nested structures, so their indentation
# is significant. Flattening them produces duplicate top-level keys.

# Base model configuration (use HuggingFace model or local path)
model_id: "KBlueLeaf/kohaku-v2.1"
# model_id: "C:\\_dev\\models\\your_sd15_model.safetensors"

# StreamDiffusion core parameters
# NOTE(review): in upstream StreamDiffusion, lower indices appear to select
# noisier timesteps (i.e. stronger denoising) - confirm the wording below.
t_index_list: [16, 32]  # Denoising timesteps - lower values = less denoising
width: 512
height: 512
device: "cuda"
dtype: "float16"

# Generation parameters
# prompt: "masterpiece, high quality, detailed, cinematic lighting"  # Overridden by prompt_blending below

# Prompt blending configuration - interpolates between multiple prompts
prompt_blending:
  # Each entry is a [prompt text, weight] pair
  prompt_list:
    - ["masterpiece, studio ghibli style, detailed anime artwork", 1.0]
    - ["cyberpunk aesthetic, neon lights, futuristic", 0.3]
  interpolation_method: "slerp"  # or "linear"
  enable_caching: true

negative_prompt: "blurry, low quality, distorted, 3d render"
guidance_scale: 1.1
num_inference_steps: 50
seed: 789

# Temporal consistency and optimization
frame_buffer_size: 1
delta: 0.7
use_denoising_batch: true
use_lcm_lora: true
use_tiny_vae: true
acceleration: "tensorrt"  # "xformers" for non-TensorRT setups
cfg_type: "self"

# Engine directory for TensorRT (engines will be built here if not found)
engine_dir: "./engines/sd15"

# Enable multi-modal conditioning
use_controlnet: true
use_ipadapter: true

# IPAdapter configuration for style conditioning
ipadapters:
  - ipadapter_model_path: "h94/IP-Adapter/models/ip-adapter_sd15.safetensors"
    image_encoder_path: "h94/IP-Adapter/models/image_encoder"
    # style_image: "path/to/your/style/image.jpg"  # Optional: specify style image
    scale: 0.7
    enabled: true

# ControlNet configurations
controlnets:
  # TensorRT Depth ControlNet (requires TensorRT engine)
  - model_id: "lllyasviel/control_v11f1p_sd15_depth"
    conditioning_scale: 0.3
    preprocessor: "depth_tensorrt"
    preprocessor_params:
      # REQUIRED: Path to TensorRT engine (replace with your local path)
      engine_path: "C:\\_dev\\models\\tensorrt\\depth_anything_v2_vits-fp16.engine"
      detect_resolution: 518  # Must match engine input size
      image_resolution: 512
    enabled: true

  # Tile ControlNet with feedback processor for temporal consistency
  - model_id: "lllyasviel/control_v11f1e_sd15_tile"
    conditioning_scale: 0.2
    preprocessor: "feedback"
    preprocessor_params:
      image_resolution: 512
      feedback_strength: 0.15  # Controls temporal feedback intensity
    enabled: true
28 changes: 0 additions & 28 deletions configs/sd15_tile.yaml.example

This file was deleted.

33 changes: 0 additions & 33 deletions configs/sdturbo_color.yaml.example

This file was deleted.

51 changes: 0 additions & 51 deletions configs/sdturbo_mediapipe_pose_depth_trt.yaml.example

This file was deleted.

57 changes: 57 additions & 0 deletions configs/sdturbo_multicontrol.yaml.example
Original file line number Diff line number Diff line change
@@ -0,0 +1,57 @@
# StreamDiffusion SD-Turbo Multi-ControlNet Configuration
# Demonstrates: Fast inference with multiple ControlNet guidance (no IPAdapter for speed)
#
# Layout: scalar pipeline settings live at the top level; each `controlnets`
# entry is a nested mapping, so its indentation is significant.

# Base model configuration
model_id: "stabilityai/sd-turbo"

# StreamDiffusion core parameters
# Entries are indices into the scheduler's timestep list, whose length is
# num_inference_steps - every index must be < num_inference_steps.
t_index_list: [0, 16]  # SD-Turbo optimized timesteps
width: 512
height: 512
device: "cuda"
dtype: "float16"

# Generation parameters
prompt: "masterpiece, high quality, detailed anime character"
negative_prompt: "blurry, low quality, distorted, 3d render"
guidance_scale: 1.0  # SD-Turbo typically uses lower guidance
# Length of the timestep schedule that t_index_list indexes into. It must
# exceed the largest index above (16); the previous value of 4 left index 16
# out of range. The number of denoising passes actually run per frame is
# len(t_index_list), so this does not slow inference.
num_inference_steps: 50
seed: 789

# Temporal consistency and optimization
frame_buffer_size: 1
delta: 0.7
use_denoising_batch: true
# NOTE(review): SD-Turbo is SD2.1-based (see the sd21 ControlNets below);
# confirm the LCM LoRA being loaded is compatible with it, otherwise set false.
use_lcm_lora: true  # SD-Turbo benefits from LCM LoRA
use_tiny_vae: true
acceleration: "tensorrt"  # "xformers" for non-TensorRT setups
cfg_type: "self"

# Engine directory for TensorRT
engine_dir: "./engines/sdturbo"

# Enable ControlNet (no IPAdapter for maximum speed)
use_controlnet: true

# ControlNet configurations
controlnets:
  # Canny edge detection for structural guidance
  - model_id: "thibaud/controlnet-sd21-canny-diffusers"
    conditioning_scale: 0.5
    preprocessor: "canny"
    preprocessor_params:
      low_threshold: 100
      high_threshold: 200
    enabled: true

  # Soft edge detection for artistic guidance
  - model_id: "thibaud/controlnet-sd21-hed-diffusers"
    conditioning_scale: 0.3
    preprocessor: "soft_edge"
    preprocessor_params:
      image_resolution: 512
      strength: 1.0
      soft_threshold: 0.5
      multi_scale: true
      gaussian_sigma: 1.0
    enabled: true
Loading