Skip to content

Commit c9e92cd

Browse files
committed
model sorter organization
1 parent 99d4d8b commit c9e92cd

File tree

2 files changed

+27
-22
lines changed

2 files changed

+27
-22
lines changed

docs/Model Support.md

+6-4
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
[Stable Cascade](#stable-cascade) | unet cascade | 2024 | Stability AI | 5B | Outdated |
1414
[PixArt Sigma](#pixart-sigma) | DiT | 2024 | PixArt | 1B | Outdated |
1515
[Nvidia Sana](#nvidia-sana) | DiT | 2024 | NVIDIA | 1.6B | Modern, Low Quality |
16-
[AuraFlow v0.1 and v0.2](#auraflow-v01) | MMDiT | 2024 | Fal.AI | 6B | Outdated |
16+
[AuraFlow](#auraflow) | MMDiT | 2024 | Fal.AI | 6B | Outdated |
1717
[Flux.1](#black-forest-labs-flux1-models) | MMDiT | 2024 | Black Forest Labs | 12B | Modern, High Quality |
1818
[Lumina 2.0](#lumina-2) | NextDiT | 2025 | Alpha-VLLM | 2.6B | Modern, Decent Quality |
1919

@@ -157,14 +157,16 @@ These steps are not friendly to beginners (if Sana gains popularity, likely more
157157
- Only Sana 1600M 1024 has been validated currently
158158
- use a CFG around 4
159159

160-
# AuraFlow v0.1
160+
# AuraFlow
161161

162162
![img](/docs/images/models/auraflow-02.jpg)
163163
*(above image is AuraFlow v0.2)*
164164

165-
[Fal.ai's AuraFlow v0.1](https://huggingface.co/fal/AuraFlow/tree/main) and [v0.2](https://huggingface.co/fal/AuraFlow-v0.2) is supported in Swarm, but you must manually select architecture to use it. (The AuraFlow team said they intend to add modelspec metadata in the future).
165+
[Fal.ai's AuraFlow v0.1](https://huggingface.co/fal/AuraFlow/tree/main), [v0.2](https://huggingface.co/fal/AuraFlow-v0.2), and v0.3 are supported in Swarm, but you must manually select the architecture to use them.
166166

167-
Download the model, then click "`Edit Metadata`" and select `(Temporary) AuraFlow` as the architecture, and set resolution to `1024x1024`.
167+
Download the model, then click "`Edit Metadata`" and select `AuraFlow` as the architecture, and set resolution to `1024x1024`.
168+
169+
Parameters and usage are the same as for any other normal model.
168170

169171
# Black Forest Labs' Flux.1 Models
170172

src/Text2Image/T2IModelClassSorter.cs

+21-18
Original file line numberDiff line numberDiff line change
@@ -328,15 +328,7 @@ JToken GetEmbeddingKey(JObject h)
328328
{
329329
return isWan21_14b(h) && isWanI2v(h);
330330
}});
331-
// ====================== Random Other Models ======================
332-
Register(new() { ID = "alt_diffusion_v1_512_placeholder", CompatClass = "alt_diffusion_v1", Name = "Alt-Diffusion", StandardWidth = 512, StandardHeight = 512, IsThisModelOfClass = (m, h) =>
333-
{
334-
return IsAlt(h);
335-
}});
336-
Register(new() { ID = "lightricks-ltx-video", CompatClass = "lightricks-ltx-video", Name = "Lightricks LTX Video", StandardWidth = 768, StandardHeight = 512, IsThisModelOfClass = (m, h) =>
337-
{
338-
return isLtxv(h);
339-
}});
331+
// ====================== Hunyuan Video ======================
340332
Register(new() { ID = "hunyuan-video", CompatClass = "hunyuan-video", Name = "Hunyuan Video", StandardWidth = 720, StandardHeight = 720, IsThisModelOfClass = (m, h) =>
341333
{
342334
return isHunyuanVideo(h) && !isHunyuanVideoNativeImage2V(h);
@@ -365,14 +357,7 @@ JToken GetEmbeddingKey(JObject h)
365357
{
366358
return isHunyuanVideoLora(h);
367359
}});
368-
Register(new() { ID = "nvidia-sana-1600", CompatClass = "nvidia-sana-1600", Name = "NVIDIA Sana 1600M", StandardWidth = 1024, StandardHeight = 1024, IsThisModelOfClass = (m, h) =>
369-
{
370-
return isSana(h);
371-
}});
372-
Register(new() { ID = "nvidia-sana-1600/vae", CompatClass = "nvidia-sana-1600", Name = "NVIDIA Sana 1600M DC-AE VAE", StandardWidth = 1024, StandardHeight = 1024, IsThisModelOfClass = (m, h) =>
373-
{
374-
return h.ContainsKey("decoder.stages.0.0.main.conv.bias");
375-
}});
360+
// ====================== Nvidia Cosmos ======================
376361
Register(new() { ID = "nvidia-cosmos-1-7b-text2world", CompatClass = "nvidia-cosmos-1", Name = "NVIDIA Cosmos 1.0 Diffusion (7B) Text2World", StandardWidth = 960, StandardHeight = 960, IsThisModelOfClass = (m, h) =>
377362
{
378363
return isCosmos7b(h) && (int)h["net.x_embedder.proj.1.weight"]["shape"].ToArray()[^1].Value<long>() == 68;
@@ -393,11 +378,29 @@ JToken GetEmbeddingKey(JObject h)
393378
{
394379
return isCosmosVae(h);
395380
}});
381+
// ====================== Random Other Models ======================
382+
Register(new() { ID = "alt_diffusion_v1_512_placeholder", CompatClass = "alt_diffusion_v1", Name = "Alt-Diffusion", StandardWidth = 512, StandardHeight = 512, IsThisModelOfClass = (m, h) =>
383+
{
384+
return IsAlt(h);
385+
}});
386+
Register(new() { ID = "lightricks-ltx-video", CompatClass = "lightricks-ltx-video", Name = "Lightricks LTX Video", StandardWidth = 768, StandardHeight = 512, IsThisModelOfClass = (m, h) =>
387+
{
388+
return isLtxv(h);
389+
}});
390+
Register(new() { ID = "nvidia-sana-1600", CompatClass = "nvidia-sana-1600", Name = "NVIDIA Sana 1600M", StandardWidth = 1024, StandardHeight = 1024, IsThisModelOfClass = (m, h) =>
391+
{
392+
return isSana(h);
393+
}});
394+
Register(new() { ID = "nvidia-sana-1600/vae", CompatClass = "nvidia-sana-1600", Name = "NVIDIA Sana 1600M DC-AE VAE", StandardWidth = 1024, StandardHeight = 1024, IsThisModelOfClass = (m, h) =>
395+
{
396+
return h.ContainsKey("decoder.stages.0.0.main.conv.bias");
397+
}});
396398
Register(new() { ID = "lumina-2", CompatClass = "lumina-2", Name = "Lumina 2", StandardWidth = 1024, StandardHeight = 1024, IsThisModelOfClass = (m, h) =>
397399
{
398400
return isLumina2(h);
399401
}});
400-
// Everything below this point does not autodetect, it must match through ModelSpec
402+
// ====================== Everything below this point does not autodetect, it must match through ModelSpec or be manually set ======================
403+
// General Stable Diffusion variants
401404
Register(new() { ID = "stable-diffusion-v1/vae", CompatClass = "stable-diffusion-v1", Name = "Stable Diffusion v1 VAE", StandardWidth = 512, StandardHeight = 512, IsThisModelOfClass = (m, h) => { return false; } });
402405
Register(new() { ID = "stable-diffusion-v1/inpaint", CompatClass = "stable-diffusion-v1", Name = "Stable Diffusion v1 (Inpainting)", StandardWidth = 512, StandardHeight = 512, IsThisModelOfClass = (m, h) => { return false; } });
403406
Register(new() { ID = "stable-diffusion-v2-768-v/lora", CompatClass = "stable-diffusion-v2", Name = "Stable Diffusion v2 LoRA", StandardWidth = 768, StandardHeight = 768, IsThisModelOfClass = (m, h) => { return false; } });

0 commit comments

Comments
 (0)