Anima

Anima 是什么？

Anima 是由 CircleStone Labs 与 Comfy Org 合作开发的 2B 参数图像生成模型。

它以 NVIDIA Cosmos 为基础，是使用数百万张动漫图像和艺术图像训练的纯动漫模型。

作为 SDXL 时代动漫模型的迁移候选之一，Anima 备受期待。

许可证为 CircleStone Labs Non-Commercial License。
Anima 模型本身、派生模型和 LoRA 等仅限非商业用途，但生成的图像可以用于商业用途。

模型下载

diffusion_models
- anima-base-v1.0.safetensors (4.18 GB)
text_encoders
- qwen_3_06b_base.safetensors (1.19 GB)
vae
- qwen_image_vae.safetensors (254 MB)

📂ComfyUI/
└── 📂models/
    ├── 📂diffusion_models/
    │   └── anima-base-v1.0.safetensors
    ├── 📂text_encoders/
    │   └── qwen_3_06b_base.safetensors
    └── 📂vae/
        └── qwen_image_vae.safetensors

提示词

Anima 在训练时使用了 Danbooru 风格的标签、自然语言，以及两者的组合。

由于文本编码器的理解能力较强，提示词的写法不必像 Pony Diffusion V6 那样严格；不过在提示词开头加上如下质量标签，效果可能会更好。

masterpiece, best quality, score_9, safe,

text2image

anima-base-v1.0.json

{
  "id": "d8034549-7e0a-40f1-8c2e-de3ffc6f1cae",
  "revision": 0,
  "last_node_id": 72,
  "last_link_id": 121,
  "nodes": [
    {
      "id": 54,
      "type": "ModelSamplingAuraFlow",
      "pos": [
        603.9390258789062,
        45.71437377929687
      ],
      "size": [
        230.33058166503906,
        58
      ],
      "flags": {},
      "order": 5,
      "mode": 0,
      "inputs": [
        {
          "name": "model",
          "type": "MODEL",
          "link": 99
        }
      ],
      "outputs": [
        {
          "name": "MODEL",
          "type": "MODEL",
          "links": [
            100
          ]
        }
      ],
      "properties": {
        "cnr_id": "comfy-core",
        "ver": "0.3.49",
        "Node name for S&R": "ModelSamplingAuraFlow"
      },
      "widgets_values": [
        3
      ]
    },
    {
      "id": 56,
      "type": "SaveImage",
      "pos": [
        1443.3798111474612,
        188.1918182373047
      ],
      "size": [
        840.8608467636989,
        696.6737191157355
      ],
      "flags": {},
      "order": 10,
      "mode": 0,
      "inputs": [
        {
          "name": "images",
          "type": "IMAGE",
          "link": 101
        }
      ],
      "outputs": [],
      "properties": {
        "cnr_id": "comfy-core",
        "ver": "0.3.75"
      },
      "widgets_values": [
        "ComfyUI"
      ]
    },
    {
      "id": 8,
      "type": "VAEDecode",
      "pos": [
        1252.432861328125,
        188.1918182373047
      ],
      "size": [
        157.56002807617188,
        46
      ],
      "flags": {},
      "order": 9,
      "mode": 0,
      "inputs": [
        {
          "name": "samples",
          "type": "LATENT",
          "link": 35
        },
        {
          "name": "vae",
          "type": "VAE",
          "link": 76
        }
      ],
      "outputs": [
        {
          "name": "IMAGE",
          "type": "IMAGE",
          "slot_index": 0,
          "links": [
            101
          ]
        }
      ],
      "properties": {
        "cnr_id": "comfy-core",
        "ver": "0.3.33",
        "Node name for S&R": "VAEDecode"
      },
      "widgets_values": []
    },
    {
      "id": 37,
      "type": "UNETLoader",
      "pos": [
        267.6552734375,
        45.71437377929687
      ],
      "size": [
        305.3782043457031,
        82
      ],
      "flags": {},
      "order": 0,
      "mode": 0,
      "inputs": [],
      "outputs": [
        {
          "name": "MODEL",
          "type": "MODEL",
          "slot_index": 0,
          "links": [
            99
          ]
        }
      ],
      "properties": {
        "cnr_id": "comfy-core",
        "ver": "0.3.33",
        "Node name for S&R": "UNETLoader"
      },
      "widgets_values": [
        "anima-base-v1.0.safetensors",
        "default"
      ],
      "color": "#323",
      "bgcolor": "#535"
    },
    {
      "id": 71,
      "type": "MarkdownNote",
      "pos": [
        -139.29483075353875,
        -55.59164398492874
      ],
      "size": [
        361.4596634874822,
        279.1595832744705
      ],
      "flags": {},
      "order": 1,
      "mode": 0,
      "inputs": [],
      "outputs": [],
      "properties": {},
      "widgets_values": [
        "## models\n\n* diffusion_models\n\n  * [anima-base-v1.0.safetensors](https://huggingface.co/circlestone-labs/Anima/blob/main/split_files/diffusion_models/anima-base-v1.0.safetensors) (4.18 GB)\n\n* text_encoders\n\n  * [qwen_3_06b_base.safetensors](https://huggingface.co/circlestone-labs/Anima/blob/main/split_files/text_encoders/qwen_3_06b_base.safetensors) (1.19 GB)\n\n* vae\n\n  * [qwen_image_vae.safetensors](https://huggingface.co/circlestone-labs/Anima/blob/main/split_files/vae/qwen_image_vae.safetensors) (254 MB)\n\n```text\n📂ComfyUI/\n└── 📂models/\n    ├── 📂diffusion_models/\n    │   └── anima-base-v1.0.safetensors\n    ├── 📂text_encoders/\n    │   └── qwen_3_06b_base.safetensors\n    └── 📂vae/\n        └── qwen_image_vae.safetensors\n```"
      ],
      "color": "#323",
      "bgcolor": "#535"
    },
    {
      "id": 38,
      "type": "CLIPLoader",
      "pos": [
        56.288665771484375,
        312.74468994140625
      ],
      "size": [
        301.3524169921875,
        106
      ],
      "flags": {},
      "order": 2,
      "mode": 0,
      "inputs": [],
      "outputs": [
        {
          "name": "CLIP",
          "type": "CLIP",
          "slot_index": 0,
          "links": [
            74,
            75
          ]
        }
      ],
      "properties": {
        "cnr_id": "comfy-core",
        "ver": "0.3.33",
        "Node name for S&R": "CLIPLoader"
      },
      "widgets_values": [
        "qwen_3_06b_base.safetensors",
        "stable_diffusion",
        "default"
      ],
      "color": "#432",
      "bgcolor": "#653"
    },
    {
      "id": 39,
      "type": "VAELoader",
      "pos": [
        977.9548217773436,
        69.71437377929689
      ],
      "size": [
        235.80000000000018,
        58
      ],
      "flags": {},
      "order": 3,
      "mode": 0,
      "inputs": [],
      "outputs": [
        {
          "name": "VAE",
          "type": "VAE",
          "slot_index": 0,
          "links": [
            76
          ]
        }
      ],
      "properties": {
        "cnr_id": "comfy-core",
        "ver": "0.3.33",
        "Node name for S&R": "VAELoader"
      },
      "widgets_values": [
        "qwen_image_vae.safetensors"
      ],
      "color": "#322",
      "bgcolor": "#533"
    },
    {
      "id": 60,
      "type": "EmptyLatentImage",
      "pos": [
        597.2695922851562,
        584.737218645886
      ],
      "size": [
        237,
        106
      ],
      "flags": {},
      "order": 4,
      "mode": 0,
      "inputs": [],
      "outputs": [
        {
          "name": "LATENT",
          "type": "LATENT",
          "links": [
            103
          ]
        }
      ],
      "properties": {
        "cnr_id": "comfy-core",
        "ver": "0.3.40",
        "Node name for S&R": "EmptyLatentImage"
      },
      "widgets_values": [
        1152,
        896,
        1
      ]
    },
    {
      "id": 7,
      "type": "CLIPTextEncode",
      "pos": [
        413.60047785937076,
        403.99281184374564
      ],
      "size": [
        419.26959228515625,
        107.08506774902344
      ],
      "flags": {
        "collapsed": false
      },
      "order": 7,
      "mode": 0,
      "inputs": [
        {
          "name": "clip",
          "type": "CLIP",
          "link": 75
        }
      ],
      "outputs": [
        {
          "name": "CONDITIONING",
          "type": "CONDITIONING",
          "slot_index": 0,
          "links": [
            52
          ]
        }
      ],
      "title": "CLIP Text Encode (Negative Prompt)",
      "properties": {
        "cnr_id": "comfy-core",
        "ver": "0.3.33",
        "Node name for S&R": "CLIPTextEncode"
      },
      "widgets_values": [
        "worst quality, low quality, score_1, close-up face only, portrait crop, poolside, float ring, beach ball, toy boat, water gun, chibi, giant eyes, thick lineart, western comic, photorealistic, 3d, cgi, painterly, watercolor, muddy colors, neon colors, text, logo, watermark, looking at viewer"
      ]
    },
    {
      "id": 6,
      "type": "CLIPTextEncode",
      "pos": [
        415.00001525878906,
        186
      ],
      "size": [
        419.26959228515625,
        156.00363159179688
      ],
      "flags": {},
      "order": 6,
      "mode": 0,
      "inputs": [
        {
          "name": "clip",
          "type": "CLIP",
          "link": 74
        }
      ],
      "outputs": [
        {
          "name": "CONDITIONING",
          "type": "CONDITIONING",
          "slot_index": 0,
          "links": [
            46
          ]
        }
      ],
      "title": "CLIP Text Encode (Positive Prompt)",
      "properties": {
        "cnr_id": "comfy-core",
        "ver": "0.3.33",
        "Node name for S&R": "CLIPTextEncode"
      },
      "widgets_values": [
        "safe, masterpiece, best quality, score_9, score_8_up, anime screenshot, modern japanese illustration, high quality anime key visual, clean thin lineart, delicate linework, restrained line weight, refined anatomy, elegant proportions, slightly sharp face, narrow expressive eyes, subtle eyelashes, small nose, soft blush, muted but vivid colors, rich summer colors, bright but controlled saturation, dusty teal shadows, warm orange highlights, golden summer sunlight, soft cel shading, reduced palette, beautiful reflected light, beautiful window reflections, beautiful street reflections, emotional lighting, calm graphic balance, polished rendering,\n\n1girl, solo, giant japanese high school girl, school uniform, summer uniform, short sleeve blouse, pleated skirt, loose socks, loafers, drinking a frappuccino from a clear plastic cup with a straw, candid pose, natural posture, relaxed expression, slightly amused, not looking at viewer, no eye contact, looking to the side, look side, looking down toward the city, face turned away from camera, side profile feeling,\n\nclose high oblique view, near aerial angle, medium wide shot, the camera is close to the giant girl, the girl dominates the composition, large foreground character, her upper body and legs are clearly visible, she occupies about half of the image height, enormous scale contrast, miniature Tokyo-like city below and behind her,\n\nShe is casually sitting on the edge of a tall building, leaning lightly against another nearby building as if it were a wall. The city below is tiny compared to her. The moment feels ordinary to her but absurd to the viewer, like a quiet summer afternoon in an impossible world.\n\nA richly rendered Tokyo-like summer city spreads below her, dense but readable: sunlit rooftops, narrow streets, train tracks, rooftop machinery, glass windows, signs, tiny cars, intersections, convenience-store-like corners, vending machines, and layered buildings. The background has the richness of an anime film background, with detailed architecture, warm sunlight, blue-green shadows, bright reflected light, and a vivid summer atmosphere.\n\nKeep the character clean and elegant with thin anime lineart and soft cel shading, while the city background is richer, more textured, and more detailed. The contrast between the clean character and the dense vivid city is important. The image should feel natural, funny, and surreal at the same time, not like a posed pinup.\n\nsummer daylight, blue sky feeling, hot summer air, sunlit concrete, saturated teal shadows, warm peach highlights, sparkling window reflections, bright rooftop highlights, soft atmospheric depth, colorful but not garish, calm whimsical mood"
      ]
    },
    {
      "id": 3,
      "type": "KSampler",
      "pos": [
        898.7548217773438,
        188.1918182373047
      ],
      "size": [
        315,
        262
      ],
      "flags": {},
      "order": 8,
      "mode": 0,
      "inputs": [
        {
          "name": "model",
          "type": "MODEL",
          "link": 100
        },
        {
          "name": "positive",
          "type": "CONDITIONING",
          "link": 46
        },
        {
          "name": "negative",
          "type": "CONDITIONING",
          "link": 52
        },
        {
          "name": "latent_image",
          "type": "LATENT",
          "link": 103
        }
      ],
      "outputs": [
        {
          "name": "LATENT",
          "type": "LATENT",
          "slot_index": 0,
          "links": [
            35
          ]
        }
      ],
      "properties": {
        "cnr_id": "comfy-core",
        "ver": "0.3.33",
        "Node name for S&R": "KSampler"
      },
      "widgets_values": [
        1234,
        "fixed",
        30,
        4,
        "er_sde",
        "simple",
        1
      ]
    }
  ],
  "links": [
    [
      35,
      3,
      0,
      8,
      0,
      "LATENT"
    ],
    [
      46,
      6,
      0,
      3,
      1,
      "CONDITIONING"
    ],
    [
      52,
      7,
      0,
      3,
      2,
      "CONDITIONING"
    ],
    [
      74,
      38,
      0,
      6,
      0,
      "CLIP"
    ],
    [
      75,
      38,
      0,
      7,
      0,
      "CLIP"
    ],
    [
      76,
      39,
      0,
      8,
      1,
      "VAE"
    ],
    [
      99,
      37,
      0,
      54,
      0,
      "MODEL"
    ],
    [
      100,
      54,
      0,
      3,
      0,
      "MODEL"
    ],
    [
      101,
      8,
      0,
      56,
      0,
      "IMAGE"
    ],
    [
      103,
      60,
      0,
      3,
      3,
      "LATENT"
    ]
  ],
  "groups": [],
  "config": {},
  "extra": {
    "ds": {
      "scale": 0.6830134553650707,
      "offset": [
        334.6282433711493,
        334.46305304151196
      ]
    },
    "frontendVersion": "1.44.19",
    "VHS_latentpreview": false,
    "VHS_latentpreviewrate": 0,
    "VHS_MetadataImage": true,
    "VHS_KeepIntermediate": true
  },
  "version": 0.4
}

推荐分辨率是 512px 到 1536px。
推荐使用 er_sde 或 euler_ancestral 这类带有一定随机性的采样器。

Anima

Anima 是什么？

模型下载

提示词

text2image

什么是 JSON 复制按钮？

这个页面有问题！

请补充讲解！

感想 / 其他

感谢！