Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +40 -0
- .job_config.json +139 -0
- claymation_stoners_z_image_v1.safetensors +3 -0
- claymation_stoners_z_image_v1_000002000.safetensors +3 -0
- claymation_stoners_z_image_v1_000002250.safetensors +3 -0
- claymation_stoners_z_image_v1_000002500.safetensors +3 -0
- claymation_stoners_z_image_v1_000002750.safetensors +3 -0
- config.yaml +203 -0
- log.txt +0 -0
- optimizer.pt +3 -0
- pid.txt +1 -0
- samples/1764475531114__000000000_0.jpg +3 -0
- samples/1764475535513__000000000_1.jpg +3 -0
- samples/1764475539875__000000000_2.jpg +3 -0
- samples/1764475543731__000000000_3.jpg +0 -0
- samples/1764475548071__000000000_4.jpg +3 -0
- samples/1764475870233__000000250_0.jpg +3 -0
- samples/1764475874667__000000250_1.jpg +3 -0
- samples/1764475879046__000000250_2.jpg +3 -0
- samples/1764475882942__000000250_3.jpg +0 -0
- samples/1764475887319__000000250_4.jpg +3 -0
- samples/1764476197013__000000500_0.jpg +3 -0
- samples/1764476201428__000000500_1.jpg +3 -0
- samples/1764476205796__000000500_2.jpg +0 -0
- samples/1764476209675__000000500_3.jpg +0 -0
- samples/1764476214030__000000500_4.jpg +3 -0
- samples/1764476527852__000000750_0.jpg +3 -0
- samples/1764476532266__000000750_1.jpg +3 -0
- samples/1764476536624__000000750_2.jpg +0 -0
- samples/1764476540501__000000750_3.jpg +0 -0
- samples/1764476544864__000000750_4.jpg +3 -0
- samples/1764476860552__000001000_0.jpg +3 -0
- samples/1764476864961__000001000_1.jpg +3 -0
- samples/1764476869317__000001000_2.jpg +0 -0
- samples/1764476873191__000001000_3.jpg +0 -0
- samples/1764476877547__000001000_4.jpg +3 -0
- samples/1764477190362__000001250_0.jpg +3 -0
- samples/1764477194781__000001250_1.jpg +3 -0
- samples/1764477199146__000001250_2.jpg +3 -0
- samples/1764477203031__000001250_3.jpg +0 -0
- samples/1764477207420__000001250_4.jpg +3 -0
- samples/1764477529187__000001500_0.jpg +3 -0
- samples/1764477533781__000001500_1.jpg +3 -0
- samples/1764477538164__000001500_2.jpg +3 -0
- samples/1764477542071__000001500_3.jpg +0 -0
- samples/1764477546468__000001500_4.jpg +3 -0
- samples/1764477865752__000001750_0.jpg +3 -0
- samples/1764477870194__000001750_1.jpg +3 -0
- samples/1764477874581__000001750_2.jpg +0 -0
- samples/1764477878497__000001750_3.jpg +0 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,43 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
samples/1764475531114__000000000_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
samples/1764475535513__000000000_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
samples/1764475539875__000000000_2.jpg filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
samples/1764475548071__000000000_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
samples/1764475870233__000000250_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
samples/1764475874667__000000250_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
samples/1764475879046__000000250_2.jpg filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
samples/1764475887319__000000250_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
samples/1764476197013__000000500_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
samples/1764476201428__000000500_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
samples/1764476214030__000000500_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
samples/1764476527852__000000750_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
samples/1764476532266__000000750_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
samples/1764476544864__000000750_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
samples/1764476860552__000001000_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
samples/1764476864961__000001000_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
samples/1764476877547__000001000_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
samples/1764477190362__000001250_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
samples/1764477194781__000001250_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
samples/1764477199146__000001250_2.jpg filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
samples/1764477207420__000001250_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
samples/1764477529187__000001500_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
samples/1764477533781__000001500_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
samples/1764477538164__000001500_2.jpg filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
samples/1764477546468__000001500_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
samples/1764477865752__000001750_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
samples/1764477870194__000001750_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
samples/1764478195344__000002000_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
samples/1764478199781__000002000_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
samples/1764478212482__000002000_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
samples/1764478525997__000002250_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
samples/1764478530416__000002250_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
samples/1764478543045__000002250_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
samples/1764478855775__000002500_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
samples/1764478860248__000002500_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
samples/1764478872907__000002500_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
samples/1764479194903__000002750_0.jpg filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
samples/1764479199322__000002750_1.jpg filter=lfs diff=lfs merge=lfs -text
|
| 74 |
+
samples/1764479211939__000002750_4.jpg filter=lfs diff=lfs merge=lfs -text
|
| 75 |
+
samples/1764479525472__000003000_0.jpg filter=lfs diff=lfs merge=lfs -text
|
.job_config.json
ADDED
|
@@ -0,0 +1,139 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"job": "extension",
|
| 3 |
+
"config": {
|
| 4 |
+
"name": "claymation_stoners_z_image_v1",
|
| 5 |
+
"process": [
|
| 6 |
+
{
|
| 7 |
+
"type": "diffusion_trainer",
|
| 8 |
+
"training_folder": "/app/ai-toolkit/output",
|
| 9 |
+
"sqlite_db_path": "/app/ai-toolkit/aitk_db.db",
|
| 10 |
+
"device": "cuda",
|
| 11 |
+
"trigger_word": null,
|
| 12 |
+
"performance_log_every": 10,
|
| 13 |
+
"network": {
|
| 14 |
+
"type": "lora",
|
| 15 |
+
"linear": 32,
|
| 16 |
+
"linear_alpha": 32,
|
| 17 |
+
"conv": 16,
|
| 18 |
+
"conv_alpha": 16,
|
| 19 |
+
"lokr_full_rank": true,
|
| 20 |
+
"lokr_factor": -1,
|
| 21 |
+
"network_kwargs": {
|
| 22 |
+
"ignore_if_contains": []
|
| 23 |
+
}
|
| 24 |
+
},
|
| 25 |
+
"save": {
|
| 26 |
+
"dtype": "bf16",
|
| 27 |
+
"save_every": 250,
|
| 28 |
+
"max_step_saves_to_keep": 4,
|
| 29 |
+
"save_format": "diffusers",
|
| 30 |
+
"push_to_hub": false
|
| 31 |
+
},
|
| 32 |
+
"datasets": [
|
| 33 |
+
{
|
| 34 |
+
"folder_path": "/app/ai-toolkit/datasets/claymation_stoners",
|
| 35 |
+
"mask_path": null,
|
| 36 |
+
"mask_min_value": 0.1,
|
| 37 |
+
"default_caption": "",
|
| 38 |
+
"caption_ext": "txt",
|
| 39 |
+
"caption_dropout_rate": 0.05,
|
| 40 |
+
"cache_latents_to_disk": false,
|
| 41 |
+
"is_reg": false,
|
| 42 |
+
"network_weight": 1,
|
| 43 |
+
"resolution": [
|
| 44 |
+
512,
|
| 45 |
+
768,
|
| 46 |
+
1024
|
| 47 |
+
],
|
| 48 |
+
"controls": [],
|
| 49 |
+
"shrink_video_to_frames": true,
|
| 50 |
+
"num_frames": 1,
|
| 51 |
+
"do_i2v": true,
|
| 52 |
+
"flip_x": false,
|
| 53 |
+
"flip_y": false
|
| 54 |
+
}
|
| 55 |
+
],
|
| 56 |
+
"train": {
|
| 57 |
+
"batch_size": 1,
|
| 58 |
+
"bypass_guidance_embedding": false,
|
| 59 |
+
"steps": 3000,
|
| 60 |
+
"gradient_accumulation": 1,
|
| 61 |
+
"train_unet": true,
|
| 62 |
+
"train_text_encoder": false,
|
| 63 |
+
"gradient_checkpointing": true,
|
| 64 |
+
"noise_scheduler": "flowmatch",
|
| 65 |
+
"optimizer": "adamw8bit",
|
| 66 |
+
"timestep_type": "weighted",
|
| 67 |
+
"content_or_style": "balanced",
|
| 68 |
+
"optimizer_params": {
|
| 69 |
+
"weight_decay": 0.0001
|
| 70 |
+
},
|
| 71 |
+
"unload_text_encoder": false,
|
| 72 |
+
"cache_text_embeddings": true,
|
| 73 |
+
"lr": 0.0001,
|
| 74 |
+
"ema_config": {
|
| 75 |
+
"use_ema": false,
|
| 76 |
+
"ema_decay": 0.99
|
| 77 |
+
},
|
| 78 |
+
"skip_first_sample": false,
|
| 79 |
+
"force_first_sample": false,
|
| 80 |
+
"disable_sampling": false,
|
| 81 |
+
"dtype": "bf16",
|
| 82 |
+
"diff_output_preservation": false,
|
| 83 |
+
"diff_output_preservation_multiplier": 1,
|
| 84 |
+
"diff_output_preservation_class": "person",
|
| 85 |
+
"switch_boundary_every": 1,
|
| 86 |
+
"loss_type": "mse"
|
| 87 |
+
},
|
| 88 |
+
"model": {
|
| 89 |
+
"name_or_path": "Tongyi-MAI/Z-Image-Turbo",
|
| 90 |
+
"quantize": false,
|
| 91 |
+
"qtype": "qfloat8",
|
| 92 |
+
"quantize_te": true,
|
| 93 |
+
"qtype_te": "qfloat8",
|
| 94 |
+
"arch": "zimage:turbo",
|
| 95 |
+
"low_vram": true,
|
| 96 |
+
"model_kwargs": {},
|
| 97 |
+
"layer_offloading": false,
|
| 98 |
+
"layer_offloading_text_encoder_percent": 1,
|
| 99 |
+
"layer_offloading_transformer_percent": 1,
|
| 100 |
+
"assistant_lora_path": "ostris/zimage_turbo_training_adapter/zimage_turbo_training_adapter_v1.safetensors"
|
| 101 |
+
},
|
| 102 |
+
"sample": {
|
| 103 |
+
"sampler": "flowmatch",
|
| 104 |
+
"sample_every": 250,
|
| 105 |
+
"width": 1024,
|
| 106 |
+
"height": 1024,
|
| 107 |
+
"samples": [
|
| 108 |
+
{
|
| 109 |
+
"prompt": "claymation_stoners, Two male claymation figures, Bud and Spud, sit on a beige sofa in a messy living room. Bud, on the left, has brown hair, wide eyes, and a large smile, wearing a blue t-shirt with a \"Metallica\" logo and red shorts. He holds a rainbow-colored bong with green smoke emanating from its top. Spud, on the right, has a brown beanie, closed eyes, and a wide grin, wearing a tie-dye hoodie with a green cannabis leaf symbol and olive green cargo pants. Both characters exhibit lumpy surfaces and visible fingerprints, consistent with plasticine clay. The living room features a wooden coffee table in the foreground, laden with cluttered items. Two open pizza boxes, one with two slices remaining and the other with multiple slices, are present. Several snack bags, including a red bag spilling puffed snacks and a blue bag, are scattered on the table. Two retro-style grey game controllers with colorful buttons are also on the table. A crumpled white piece of paper sits on the floor next to one pizza box. Additional snacks and crumpled papers are visible under the table. The background wall is a pale purple or pink hue, textured and lumpy. Multiple posters with psychedelic mushroom designs in vibrant colors (purple, orange, green, yellow, blue) adorn the wall. A larger blue tapestry with a circular mandala pattern hangs to the right. A small yellow lampshade is visible on a table next to Spud. Warm, hazy lighting illuminates the scene, creating soft shadows. The floor is a dark, textured surface."
|
| 110 |
+
},
|
| 111 |
+
{
|
| 112 |
+
"prompt": "claymation_stoners, Two stop-motion claymation characters, Bud and Spud, sit on a light green lumpy sofa in a cluttered living room. Bud, on the left, wears a blue Metallica t-shirt and red shorts. He has a light brown sculpted hairstyle and an annoyed expression with wide eyes and a downturned mouth. He holds a grey retro video game controller with a black cord. Spud, on the right, wears a colorful tie-dye hoodie with a green beanie. He has a potato-shaped head with tired, red eyes and his tongue sticking out. He also holds a grey retro video game controller. The living room walls are a lumpy, textured off-white. Four psychedelic mushroom posters in various sizes and colors are on the left wall, and two more, including a large blue and purple tapestry-like poster, are on the right wall. A small yellow table lamp sits on a wooden side table behind Spud. In the foreground, a wooden coffee table holds various items. Two pizza boxes are stacked on the left, one open revealing several slices of pizza with red toppings. Numerous crumpled snack bags, including one blue and one red, are scattered on the table, some with their contents (small white nuggets) spilled out. A small pile of white crumpled paper is visible near the pizza boxes. A half-eaten orange snack wrapper labeled \"Koyca\" lies on the floor near the sofa on the right. A tall, multi-colored (green, yellow, red, blue) vase or bong is behind the open pizza box. Warm, hazy, orange-yellow lighting illuminates the scene, with some purple and pink light accents on the walls and characters, suggesting a dimly lit room with atmospheric lighting. Wisps of white smoke are visible in the air above Bud and Spud. The clay characters and props exhibit a gritty, handmade plasticine texture with visible fingerprints and lumpy surfaces. The overall aesthetic is miniature and realistic."
|
| 113 |
+
},
|
| 114 |
+
{
|
| 115 |
+
"prompt": "claymation_stoners, Two claymation characters, Bud and Spud, sit on a lumpy, textured, light brown sofa in a cluttered living room. Bud, on the left, wears a blue t-shirt with \"METALLICA\" written across it in white, and red shorts. He has brown hair, closed eyes, and an open mouth with visible teeth, holding a white cigarette or pipe from which a wisp of smoke rises. His right hand holds a gray and white retro game controller. His left hand rests on his lap. Spud, on the right, wears a colorful tie-dye hoodie, grey cargo pants, and a dark brown beanie. His eyes are closed, and his mouth is a small, curved line. Spud's right hand extends toward Bud's left arm. A dark brown coffee table sits in front of the characters. On the table, an open beige pizza box with several slices of pepperoni pizza is visible on the left. Next to it, a rectangular wooden tray or box contains a single pizza slice. Further right on the table, a crumpled red soda can, a blue snack bag with yellow contents, and another pizza slice are present. A crumpled red snack bag and another red soda can are on the floor next to the table. The floor is light brown. The walls are light brown with visible texture. Three framed psychedelic mushroom posters hang on the left wall, with one more visible on the right wall near a yellow lampshade. The lighting is warm and hazy."
|
| 116 |
+
},
|
| 117 |
+
{
|
| 118 |
+
"prompt": "claymation_stoners, Two claymation figures, viewed from behind, sit on a light brown couch, facing a retro television displaying \"GAME OVER\" in pixelated block letters. The figure on the left has short, light brown hair and wears a light blue shirt with a faint green stripe. The figure on the right wears a brown cap and a green, yellow, and orange striped scarf over a light green garment. The couch is a solid, light brown color with a textured, lumpy surface. The television is dark brown with a thick frame, resting on a darker brown cabinet with two drawers. The screen background is a textured, light blue, resembling woven fabric. The \"GAME OVER\" letters are light brown. The background wall is a textured, off-white to light brown, with hints of smoke or steam rising from behind the television on both sides. A multicolored, abstract art piece hangs on the wall to the far left. A dark red or brown abstract element is on the wall to the far right. Warm, hazy lighting illuminates the scene, casting subtle glows around the television."
|
| 119 |
+
},
|
| 120 |
+
{
|
| 121 |
+
"prompt": "claymation_stoners, Two claymation characters, Bud and Spud, sit on a lumpy brown couch in a messy living room. Bud, on the left, has light brown skin, dark brown hair, a sad expression, and wears a blue t-shirt with \"m1ndb0tz\" and red shorts. He holds a multicolored green, orange, red, and yellow bong in his right hand. Spud, on the right, has a darker brown skin tone, a sad expression, and wears a dark green beanie and a multicolored striped hoodie. He holds a slice of pepperoni pizza in his right hand. A brown wooden coffee table in front of them holds two open pizza boxes, one with two pepperoni pizza slices. Other items on the table include two grey retro game controllers, two closed snack bags, one open red snack bag with yellow contents, a small white cylindrical object, a grey cylindrical electronic device with a wire, and scattered coins. The textured dark brown floor also has scattered debris and a red snack wrapper. The light brown, rough-textured wall behind them features three framed art pieces: two rectangular posters with psychedelic mushroom designs and text \"LIZARD\" and \"LIFE GAIN\", and a vertical poster with abstract multicolored swirls. A dark brown doorframe appears on the left wall section. A small yellow lamp on a stand stands behind Spud. Warm, hazy lighting fills the scene, and smoke or haze rises from behind Bud. The overall texture is gritty, lumpy plasticine with visible fingerprints."
|
| 122 |
+
}
|
| 123 |
+
],
|
| 124 |
+
"neg": "",
|
| 125 |
+
"seed": 42,
|
| 126 |
+
"walk_seed": true,
|
| 127 |
+
"guidance_scale": 1,
|
| 128 |
+
"sample_steps": 8,
|
| 129 |
+
"num_frames": 1,
|
| 130 |
+
"fps": 1
|
| 131 |
+
}
|
| 132 |
+
}
|
| 133 |
+
]
|
| 134 |
+
},
|
| 135 |
+
"meta": {
|
| 136 |
+
"name": "[name]",
|
| 137 |
+
"version": "1.0"
|
| 138 |
+
}
|
| 139 |
+
}
|
claymation_stoners_z_image_v1.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bc3c22c10e6fd3eaddc050e9106ab73bfca990780b830a6cf8d3fd4e6652bcb0
|
| 3 |
+
size 170128256
|
claymation_stoners_z_image_v1_000002000.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3883d470069935b6e398f301934c311c8b1b09b6dec623d3325c91aedcdbe01
|
| 3 |
+
size 170128256
|
claymation_stoners_z_image_v1_000002250.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c171feacd09bf98014d0acaad4bbf298d30974b2d7efad2144c79b406a2bbe2d
|
| 3 |
+
size 170128256
|
claymation_stoners_z_image_v1_000002500.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89b88be9cd5452c03d36797fbcd0d718e8f8380bf3fd9d9616ed1a2ed1eb784a
|
| 3 |
+
size 170128256
|
claymation_stoners_z_image_v1_000002750.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:484a3fad507213fe183d0cabc4de2c6bdf102b14519eef17c502e90d5b9be327
|
| 3 |
+
size 170128256
|
config.yaml
ADDED
|
@@ -0,0 +1,203 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
job: extension
|
| 2 |
+
config:
|
| 3 |
+
name: claymation_stoners_z_image_v1
|
| 4 |
+
process:
|
| 5 |
+
- type: diffusion_trainer
|
| 6 |
+
training_folder: /app/ai-toolkit/output
|
| 7 |
+
sqlite_db_path: /app/ai-toolkit/aitk_db.db
|
| 8 |
+
device: cuda
|
| 9 |
+
trigger_word: null
|
| 10 |
+
performance_log_every: 10
|
| 11 |
+
network:
|
| 12 |
+
type: lora
|
| 13 |
+
linear: 32
|
| 14 |
+
linear_alpha: 32
|
| 15 |
+
conv: 16
|
| 16 |
+
conv_alpha: 16
|
| 17 |
+
lokr_full_rank: true
|
| 18 |
+
lokr_factor: -1
|
| 19 |
+
network_kwargs:
|
| 20 |
+
ignore_if_contains: []
|
| 21 |
+
save:
|
| 22 |
+
dtype: bf16
|
| 23 |
+
save_every: 250
|
| 24 |
+
max_step_saves_to_keep: 4
|
| 25 |
+
save_format: diffusers
|
| 26 |
+
push_to_hub: false
|
| 27 |
+
datasets:
|
| 28 |
+
- folder_path: /app/ai-toolkit/datasets/claymation_stoners
|
| 29 |
+
mask_path: null
|
| 30 |
+
mask_min_value: 0.1
|
| 31 |
+
default_caption: ''
|
| 32 |
+
caption_ext: txt
|
| 33 |
+
caption_dropout_rate: 0.05
|
| 34 |
+
cache_latents_to_disk: false
|
| 35 |
+
is_reg: false
|
| 36 |
+
network_weight: 1
|
| 37 |
+
resolution:
|
| 38 |
+
- 512
|
| 39 |
+
- 768
|
| 40 |
+
- 1024
|
| 41 |
+
controls: []
|
| 42 |
+
shrink_video_to_frames: true
|
| 43 |
+
num_frames: 1
|
| 44 |
+
do_i2v: true
|
| 45 |
+
flip_x: false
|
| 46 |
+
flip_y: false
|
| 47 |
+
train:
|
| 48 |
+
batch_size: 1
|
| 49 |
+
bypass_guidance_embedding: false
|
| 50 |
+
steps: 3000
|
| 51 |
+
gradient_accumulation: 1
|
| 52 |
+
train_unet: true
|
| 53 |
+
train_text_encoder: false
|
| 54 |
+
gradient_checkpointing: true
|
| 55 |
+
noise_scheduler: flowmatch
|
| 56 |
+
optimizer: adamw8bit
|
| 57 |
+
timestep_type: weighted
|
| 58 |
+
content_or_style: balanced
|
| 59 |
+
optimizer_params:
|
| 60 |
+
weight_decay: 0.0001
|
| 61 |
+
unload_text_encoder: false
|
| 62 |
+
cache_text_embeddings: true
|
| 63 |
+
lr: 0.0001
|
| 64 |
+
ema_config:
|
| 65 |
+
use_ema: false
|
| 66 |
+
ema_decay: 0.99
|
| 67 |
+
skip_first_sample: false
|
| 68 |
+
force_first_sample: false
|
| 69 |
+
disable_sampling: false
|
| 70 |
+
dtype: bf16
|
| 71 |
+
diff_output_preservation: false
|
| 72 |
+
diff_output_preservation_multiplier: 1
|
| 73 |
+
diff_output_preservation_class: person
|
| 74 |
+
switch_boundary_every: 1
|
| 75 |
+
loss_type: mse
|
| 76 |
+
model:
|
| 77 |
+
name_or_path: Tongyi-MAI/Z-Image-Turbo
|
| 78 |
+
quantize: false
|
| 79 |
+
qtype: qfloat8
|
| 80 |
+
quantize_te: true
|
| 81 |
+
qtype_te: qfloat8
|
| 82 |
+
arch: zimage:turbo
|
| 83 |
+
low_vram: true
|
| 84 |
+
model_kwargs: {}
|
| 85 |
+
layer_offloading: false
|
| 86 |
+
layer_offloading_text_encoder_percent: 1
|
| 87 |
+
layer_offloading_transformer_percent: 1
|
| 88 |
+
assistant_lora_path: ostris/zimage_turbo_training_adapter/zimage_turbo_training_adapter_v1.safetensors
|
| 89 |
+
sample:
|
| 90 |
+
sampler: flowmatch
|
| 91 |
+
sample_every: 250
|
| 92 |
+
width: 1024
|
| 93 |
+
height: 1024
|
| 94 |
+
samples:
|
| 95 |
+
- prompt: claymation_stoners, Two male claymation figures, Bud and Spud, sit
|
| 96 |
+
on a beige sofa in a messy living room. Bud, on the left, has brown hair,
|
| 97 |
+
wide eyes, and a large smile, wearing a blue t-shirt with a "Metallica"
|
| 98 |
+
logo and red shorts. He holds a rainbow-colored bong with green smoke emanating
|
| 99 |
+
from its top. Spud, on the right, has a brown beanie, closed eyes, and a
|
| 100 |
+
wide grin, wearing a tie-dye hoodie with a green cannabis leaf symbol and
|
| 101 |
+
olive green cargo pants. Both characters exhibit lumpy surfaces and visible
|
| 102 |
+
fingerprints, consistent with plasticine clay. The living room features
|
| 103 |
+
a wooden coffee table in the foreground, laden with cluttered items. Two
|
| 104 |
+
open pizza boxes, one with two slices remaining and the other with multiple
|
| 105 |
+
slices, are present. Several snack bags, including a red bag spilling puffed
|
| 106 |
+
snacks and a blue bag, are scattered on the table. Two retro-style grey
|
| 107 |
+
game controllers with colorful buttons are also on the table. A crumpled
|
| 108 |
+
white piece of paper sits on the floor next to one pizza box. Additional
|
| 109 |
+
snacks and crumpled papers are visible under the table. The background
|
| 110 |
+
wall is a pale purple or pink hue, textured and lumpy. Multiple posters
|
| 111 |
+
with psychedelic mushroom designs in vibrant colors (purple, orange, green,
|
| 112 |
+
yellow, blue) adorn the wall. A larger blue tapestry with a circular mandala
|
| 113 |
+
pattern hangs to the right. A small yellow lampshade is visible on a table
|
| 114 |
+
next to Spud. Warm, hazy lighting illuminates the scene, creating soft shadows.
|
| 115 |
+
The floor is a dark, textured surface.
|
| 116 |
+
- prompt: claymation_stoners, Two stop-motion claymation characters, Bud and
|
| 117 |
+
Spud, sit on a light green lumpy sofa in a cluttered living room. Bud, on
|
| 118 |
+
the left, wears a blue Metallica t-shirt and red shorts. He has a light
|
| 119 |
+
brown sculpted hairstyle and an annoyed expression with wide eyes and a
|
| 120 |
+
downturned mouth. He holds a grey retro video game controller with a black
|
| 121 |
+
cord. Spud, on the right, wears a colorful tie-dye hoodie with a green beanie.
|
| 122 |
+
He has a potato-shaped head with tired, red eyes and his tongue sticking
|
| 123 |
+
out. He also holds a grey retro video game controller. The living room
|
| 124 |
+
walls are a lumpy, textured off-white. Four psychedelic mushroom posters
|
| 125 |
+
in various sizes and colors are on the left wall, and two more, including
|
| 126 |
+
a large blue and purple tapestry-like poster, are on the right wall. A small
|
| 127 |
+
yellow table lamp sits on a wooden side table behind Spud. In the foreground,
|
| 128 |
+
a wooden coffee table holds various items. Two pizza boxes are stacked on
|
| 129 |
+
the left, one open revealing several slices of pizza with red toppings.
|
| 130 |
+
Numerous crumpled snack bags, including one blue and one red, are scattered
|
| 131 |
+
on the table, some with their contents (small white nuggets) spilled out.
|
| 132 |
+
A small pile of white crumpled paper is visible near the pizza boxes. A
|
| 133 |
+
half-eaten orange snack wrapper labeled "Koyca" lies on the floor near the
|
| 134 |
+
sofa on the right. A tall, multi-colored (green, yellow, red, blue) vase
|
| 135 |
+
or bong is behind the open pizza box. Warm, hazy, orange-yellow lighting
|
| 136 |
+
illuminates the scene, with some purple and pink light accents on the walls
|
| 137 |
+
and characters, suggesting a dimly lit room with atmospheric lighting. Wisps
|
| 138 |
+
of white smoke are visible in the air above Bud and Spud. The clay characters
|
| 139 |
+
and props exhibit a gritty, handmade plasticine texture with visible fingerprints
|
| 140 |
+
and lumpy surfaces. The overall aesthetic is miniature and realistic.
|
| 141 |
+
- prompt: claymation_stoners, Two claymation characters, Bud and Spud, sit on
|
| 142 |
+
a lumpy, textured, light brown sofa in a cluttered living room. Bud, on
|
| 143 |
+
the left, wears a blue t-shirt with "METALLICA" written across it in white,
|
| 144 |
+
and red shorts. He has brown hair, closed eyes, and an open mouth with visible
|
| 145 |
+
teeth, holding a white cigarette or pipe from which a wisp of smoke rises.
|
| 146 |
+
His right hand holds a gray and white retro game controller. His left hand
|
| 147 |
+
rests on his lap. Spud, on the right, wears a colorful tie-dye hoodie, grey
|
| 148 |
+
cargo pants, and a dark brown beanie. His eyes are closed, and his mouth
|
| 149 |
+
is a small, curved line. Spud's right hand extends toward Bud's left arm.
|
| 150 |
+
A dark brown coffee table sits in front of the characters. On the table,
|
| 151 |
+
an open beige pizza box with several slices of pepperoni pizza is visible
|
| 152 |
+
on the left. Next to it, a rectangular wooden tray or box contains a single
|
| 153 |
+
pizza slice. Further right on the table, a crumpled red soda can, a blue
|
| 154 |
+
snack bag with yellow contents, and another pizza slice are present. A crumpled
|
| 155 |
+
red snack bag and another red soda can are on the floor next to the table.
|
| 156 |
+
The floor is light brown. The walls are light brown with visible texture.
|
| 157 |
+
Three framed psychedelic mushroom posters hang on the left wall, with one
|
| 158 |
+
more visible on the right wall near a yellow lampshade. The lighting is
|
| 159 |
+
warm and hazy.
|
| 160 |
+
- prompt: claymation_stoners, Two claymation figures, viewed from behind, sit
|
| 161 |
+
on a light brown couch, facing a retro television displaying "GAME OVER"
|
| 162 |
+
in pixelated block letters. The figure on the left has short, light brown
|
| 163 |
+
hair and wears a light blue shirt with a faint green stripe. The figure
|
| 164 |
+
on the right wears a brown cap and a green, yellow, and orange striped scarf
|
| 165 |
+
over a light green garment. The couch is a solid, light brown color with
|
| 166 |
+
a textured, lumpy surface. The television is dark brown with a thick frame,
|
| 167 |
+
resting on a darker brown cabinet with two drawers. The screen background
|
| 168 |
+
is a textured, light blue, resembling woven fabric. The "GAME OVER" letters
|
| 169 |
+
are light brown. The background wall is a textured, off-white to light brown,
|
| 170 |
+
with hints of smoke or steam rising from behind the television on both sides.
|
| 171 |
+
A multicolored, abstract art piece hangs on the wall to the far left. A
|
| 172 |
+
dark red or brown abstract element is on the wall to the far right. Warm,
|
| 173 |
+
hazy lighting illuminates the scene, casting subtle glows around the television.
|
| 174 |
+
- prompt: 'claymation_stoners, Two claymation characters, Bud and Spud, sit
|
| 175 |
+
on a lumpy brown couch in a messy living room. Bud, on the left, has light
|
| 176 |
+
brown skin, dark brown hair, a sad expression, and wears a blue t-shirt
|
| 177 |
+
with "m1ndb0tz" and red shorts. He holds a multicolored green, orange, red,
|
| 178 |
+
and yellow bong in his right hand. Spud, on the right, has a darker brown
|
| 179 |
+
skin tone, a sad expression, and wears a dark green beanie and a multicolored
|
| 180 |
+
striped hoodie. He holds a slice of pepperoni pizza in his right hand. A
|
| 181 |
+
brown wooden coffee table in front of them holds two open pizza boxes, one
|
| 182 |
+
with two pepperoni pizza slices. Other items on the table include two grey
|
| 183 |
+
retro game controllers, two closed snack bags, one open red snack bag with
|
| 184 |
+
yellow contents, a small white cylindrical object, a grey cylindrical electronic
|
| 185 |
+
device with a wire, and scattered coins. The textured dark brown floor also
|
| 186 |
+
has scattered debris and a red snack wrapper. The light brown, rough-textured
|
| 187 |
+
wall behind them features three framed art pieces: two rectangular posters
|
| 188 |
+
with psychedelic mushroom designs and text "LIZARD" and "LIFE GAIN", and
|
| 189 |
+
a vertical poster with abstract multicolored swirls. A dark brown doorframe
|
| 190 |
+
appears on the left wall section. A small yellow lamp on a stand stands
|
| 191 |
+
behind Spud. Warm, hazy lighting fills the scene, and smoke or haze rises
|
| 192 |
+
from behind Bud. The overall texture is gritty, lumpy plasticine with visible
|
| 193 |
+
fingerprints.'
|
| 194 |
+
neg: ''
|
| 195 |
+
seed: 42
|
| 196 |
+
walk_seed: true
|
| 197 |
+
guidance_scale: 1
|
| 198 |
+
sample_steps: 8
|
| 199 |
+
num_frames: 1
|
| 200 |
+
fps: 1
|
| 201 |
+
meta:
|
| 202 |
+
name: claymation_stoners_z_image_v1
|
| 203 |
+
version: '1.0'
|
log.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:513265caf209699c25289df90e8255075bc3c3f99c711c5d9c6cc85193902844
|
| 3 |
+
size 173288293
|
pid.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
638
|
samples/1764475531114__000000000_0.jpg
ADDED
|
Git LFS Details
|
samples/1764475535513__000000000_1.jpg
ADDED
|
Git LFS Details
|
samples/1764475539875__000000000_2.jpg
ADDED
|
Git LFS Details
|
samples/1764475543731__000000000_3.jpg
ADDED
|
samples/1764475548071__000000000_4.jpg
ADDED
|
Git LFS Details
|
samples/1764475870233__000000250_0.jpg
ADDED
|
Git LFS Details
|
samples/1764475874667__000000250_1.jpg
ADDED
|
Git LFS Details
|
samples/1764475879046__000000250_2.jpg
ADDED
|
Git LFS Details
|
samples/1764475882942__000000250_3.jpg
ADDED
|
samples/1764475887319__000000250_4.jpg
ADDED
|
Git LFS Details
|
samples/1764476197013__000000500_0.jpg
ADDED
|
Git LFS Details
|
samples/1764476201428__000000500_1.jpg
ADDED
|
Git LFS Details
|
samples/1764476205796__000000500_2.jpg
ADDED
|
samples/1764476209675__000000500_3.jpg
ADDED
|
samples/1764476214030__000000500_4.jpg
ADDED
|
Git LFS Details
|
samples/1764476527852__000000750_0.jpg
ADDED
|
Git LFS Details
|
samples/1764476532266__000000750_1.jpg
ADDED
|
Git LFS Details
|
samples/1764476536624__000000750_2.jpg
ADDED
|
samples/1764476540501__000000750_3.jpg
ADDED
|
samples/1764476544864__000000750_4.jpg
ADDED
|
Git LFS Details
|
samples/1764476860552__000001000_0.jpg
ADDED
|
Git LFS Details
|
samples/1764476864961__000001000_1.jpg
ADDED
|
Git LFS Details
|
samples/1764476869317__000001000_2.jpg
ADDED
|
samples/1764476873191__000001000_3.jpg
ADDED
|
samples/1764476877547__000001000_4.jpg
ADDED
|
Git LFS Details
|
samples/1764477190362__000001250_0.jpg
ADDED
|
Git LFS Details
|
samples/1764477194781__000001250_1.jpg
ADDED
|
Git LFS Details
|
samples/1764477199146__000001250_2.jpg
ADDED
|
Git LFS Details
|
samples/1764477203031__000001250_3.jpg
ADDED
|
samples/1764477207420__000001250_4.jpg
ADDED
|
Git LFS Details
|
samples/1764477529187__000001500_0.jpg
ADDED
|
Git LFS Details
|
samples/1764477533781__000001500_1.jpg
ADDED
|
Git LFS Details
|
samples/1764477538164__000001500_2.jpg
ADDED
|
Git LFS Details
|
samples/1764477542071__000001500_3.jpg
ADDED
|
samples/1764477546468__000001500_4.jpg
ADDED
|
Git LFS Details
|
samples/1764477865752__000001750_0.jpg
ADDED
|
Git LFS Details
|
samples/1764477870194__000001750_1.jpg
ADDED
|
Git LFS Details
|
samples/1764477874581__000001750_2.jpg
ADDED
|
samples/1764477878497__000001750_3.jpg
ADDED
|