recoilme committed on Oct 31, 2025

Commit

4152a30

1 Parent(s): f52c2f8

2410

Browse files

Files changed (22) hide show

README.md +10 -6
budget.jpg → media/budget.jpg +0 -0
promo.png → media/promo.png +0 -0
result_grid.jpg → media/result_grid.jpg +0 -0
result_grid.png → media/result_grid.png +0 -0
pipeline_sdxs.py +6 -6
samples/unet_320x640_0.jpg +2 -2
samples/unet_384x640_0.jpg +2 -2
samples/unet_448x640_0.jpg +2 -2
samples/unet_512x640_0.jpg +2 -2
samples/unet_576x640_0.jpg +2 -2
samples/unet_640x320_0.jpg +2 -2
samples/unet_640x384_0.jpg +2 -2
samples/unet_640x448_0.jpg +2 -2
samples/unet_640x512_0.jpg +2 -2
samples/unet_640x576_0.jpg +2 -2
samples/unet_640x640_0.jpg +2 -2
TRAIN.md → src/TRAIN.md +0 -0
train.old.py → src/train.old.py +0 -0
test.ipynb +2 -2
train.py +1 -1
unet/diffusion_pytorch_model.safetensors +1 -1

README.md CHANGED Viewed

@@ -7,14 +7,18 @@ pipeline_tag: text-to-image
 *XS Size, Excess Quality*
-![promo](promo.png)
 At AiArtLab, we strive to create a free, compact and fast model that can be trained on consumer graphics cards.
-- 1.5b UNet
-- Qwen3-0.6b text encoder
-- 16ch Simple VAE, which preserves details and anatomy.
-- The model was trained ~3 month on 4xRTX5090 on approximately 1+ million images with various resolutions and styles, including anime and realistic photos.
 ### Example
@@ -69,4 +73,4 @@ BTC: 3JHv9Hb8kEW8zMAccdgCdZGfrHeMhH1rpN
 ## More examples
-![result_grid](result_grid.png)

 *XS Size, Excess Quality*
+![promo](media/promo.png)
 At AiArtLab, we strive to create a free, compact and fast model that can be trained on consumer graphics cards.
+- Model: 1.5B parameters
+- Text encoder: Qwen3 (0.6B parameters)
+- VAE: 8x16ch, [Simple VAE](https://huggingface.co/AiArtLab/simplevae)
+The model was trained for ~3 months on 4xRTX 5090 GPUs using over 1 million images of various resolutions and styles, primarily anime and illustrations.
+[Gradio](https://sdxs.aiartlab.org/)
 ### Example
 ## More examples
+![result_grid](media/result_grid.jpg)

budget.jpg → media/budget.jpg RENAMED Viewed

File without changes

promo.png → media/promo.png RENAMED Viewed

File without changes

result_grid.jpg → media/result_grid.jpg RENAMED Viewed

File without changes

result_grid.png → media/result_grid.png RENAMED Viewed

File without changes

pipeline_sdxs.py CHANGED Viewed

@@ -102,9 +102,9 @@ class SdxsPipeline(DiffusionPipeline):
     def generate_latents(
         self,
         text_embeddings,
-        height: int = 576,
-        width: int = 576,
-        num_inference_steps: int = 40,
         guidance_scale: float = 5.0,
         latent_channels: int = 16,
         batch_size: int = 1,
@@ -192,9 +192,9 @@ class SdxsPipeline(DiffusionPipeline):
     def __call__(
         self,
         prompt: Optional[Union[str, List[str]]] = None,
-        height: int = 576,
-        width: int = 576,
-        num_inference_steps: int = 40,
         guidance_scale: float = 5.0,
         latent_channels: int = 16,
         output_type: str = "pil",

     def generate_latents(
         self,
         text_embeddings,
+        height: int = 640,
+        width: int = 640,
+        num_inference_steps: int = 50,
         guidance_scale: float = 5.0,
         latent_channels: int = 16,
         batch_size: int = 1,
     def __call__(
         self,
         prompt: Optional[Union[str, List[str]]] = None,
+        height: int = 640,
+        width: int = 640,
+        num_inference_steps: int = 50,
         guidance_scale: float = 5.0,
         latent_channels: int = 16,
         output_type: str = "pil",

samples/unet_320x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: de70cc7677216a340eb62bf3eada0d6cad482256b5732cb4b2f88254df756773
Pointer size: 130 Bytes
Size of remote file: 67.7 kB

Git LFS Details

SHA256: dc79b17307b4869f98f2a2fc42b7b1c48ea560da9fd5b53fa5252d27952f06a6
Pointer size: 130 Bytes
Size of remote file: 32.9 kB

samples/unet_384x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 8a7e4b4ccf58eb40cd74596425d594f0a76bc0c1d33476fb59e28a5e137e3459
Pointer size: 131 Bytes
Size of remote file: 164 kB

Git LFS Details

SHA256: 92cb2525b99d951e9237387d8436ad180943120625f18a04cd522b2d2f22215b
Pointer size: 131 Bytes
Size of remote file: 206 kB

samples/unet_448x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 77d5da2186f63a0417dbdeb892d9c18a0012922d56bab0776e10d9b7ecf519dc
Pointer size: 131 Bytes
Size of remote file: 112 kB

Git LFS Details

SHA256: ccccee0d057bef8d9b40ba2dbe80c1bb024ecf3eeba62d2055327eb6b2abea42
Pointer size: 131 Bytes
Size of remote file: 109 kB

samples/unet_512x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 3a7d8e22794795e8b40076dc403729ec64ed04aed57d6614aee57defb9dd0088
Pointer size: 131 Bytes
Size of remote file: 160 kB

Git LFS Details

SHA256: 2b99166b36c2f1a70a3f0efa18c5d2e041a0ed0dc511e61e2e1fab28f6016bd3
Pointer size: 131 Bytes
Size of remote file: 147 kB

samples/unet_576x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 49de4a3333f896ffe4f8766fb80a20f7bf3bccd4cb3bed3d7ff499801aab2bbd
Pointer size: 131 Bytes
Size of remote file: 118 kB

Git LFS Details

SHA256: 7be444a2e793a7a9173b46b4a552cf5bfc0d82550a870f14c02e60c0600677f9
Pointer size: 131 Bytes
Size of remote file: 145 kB

samples/unet_640x320_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 501741e5bd0aa1cb01c0b826b10544b2413eb019527783534179f74dbb4bb99d
Pointer size: 130 Bytes
Size of remote file: 58.8 kB

Git LFS Details

SHA256: 68f39c2010d05c079bbaebdb8f2167ca8ab47be03bb90ae23c89f0241fbedeed
Pointer size: 130 Bytes
Size of remote file: 80.1 kB

samples/unet_640x384_0.jpg CHANGED Viewed

Git LFS Details

SHA256: ad552e368f7ba04bc4274b86464fae1d80efe29c3e91b9ea5ff2a18b4463023f
Pointer size: 130 Bytes
Size of remote file: 59.7 kB

Git LFS Details

SHA256: 79d603bf4e343609b3fe712fbd184f148699ec41f99d0deaa0e834912664bdd8
Pointer size: 130 Bytes
Size of remote file: 67.6 kB

samples/unet_640x448_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 4c8cf68d5afb65ae0d0f71a7d7a94be39c8cd7973e0c02b863493f1d48e24ed2
Pointer size: 130 Bytes
Size of remote file: 97.7 kB

Git LFS Details

SHA256: 016784ea0faf48a880c25687b20e4e3e3443ab257de4f9a90af87d141bff578b
Pointer size: 131 Bytes
Size of remote file: 117 kB

samples/unet_640x512_0.jpg CHANGED Viewed

Git LFS Details

SHA256: ec08ac216bba512d71c75b115506d189f7597782368c0c6371c5d6725bcce44a
Pointer size: 130 Bytes
Size of remote file: 86.6 kB

Git LFS Details

SHA256: 9db57726ace6b91eec0b52ffd706e713e549d42048fc9d25c407b1b033149991
Pointer size: 131 Bytes
Size of remote file: 129 kB

samples/unet_640x576_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 71c327a4d8a4ac4e071d03a1855150dc0103d332579a3fb1b758f69a139678f3
Pointer size: 131 Bytes
Size of remote file: 172 kB

Git LFS Details

SHA256: bcee3c291da6263d5bed9a77c308c83109057357e18fc68f66ddd0f6cf1b0f32
Pointer size: 131 Bytes
Size of remote file: 259 kB

samples/unet_640x640_0.jpg CHANGED Viewed

Git LFS Details

SHA256: 69d1d68c72172b179048c6c7272a8b0c778c3b263da4ff17f3d347daca4079ad
Pointer size: 130 Bytes
Size of remote file: 78.6 kB

Git LFS Details

SHA256: df4520edbc282e69128bb0659002eb530919fe6cf5dc4bb292d57e332ef8908c
Pointer size: 130 Bytes
Size of remote file: 28 kB

TRAIN.md → src/TRAIN.md RENAMED Viewed

File without changes

train.old.py → src/train.old.py RENAMED Viewed

File without changes

test.ipynb CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:79e3d9e6dd5f0879cb0aa79d4cd97dd23352c9d807e9f4a593ebc234322e668c
-size 5563216

 version https://git-lfs.github.com/spec/v1
+oid sha256:3da8c81f59608e0732fe9708b4cc2becf77ea6fa215601d0f30c057110e85b3c
+size 5563222

train.py CHANGED Viewed

@@ -31,7 +31,7 @@ project = "unet"
 batch_size = 48
 base_learning_rate = 5e-5
 min_learning_rate = 1e-5
-num_epochs = 50
 # samples/save per epoch
 sample_interval_share = 3
 use_wandb = True

 batch_size = 48
 base_learning_rate = 5e-5
 min_learning_rate = 1e-5
+num_epochs = 40
 # samples/save per epoch
 sample_interval_share = 3
 use_wandb = True

unet/diffusion_pytorch_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1443f2abd54e2b73c333d8556c0dc008a2f08f7a5e2823a553347f1eebc3cd61
 size 6184944280

 version https://git-lfs.github.com/spec/v1
+oid sha256:0fd75e6dcdd3c39a84c5927b5b77f6cb8591b8feb0a9996aeca9f336b84f9d89
 size 6184944280