PseudoTerminal X committed on
Commit
fec91dc
1 Parent(s): 6cfff2b

Trained for 91 epochs and 9600 steps.

Browse files

Trained with datasets ['text-embeds-sdxl-nofilter', 'photo-concept-bucket']
Learning rate 4e-07, batch size 32, and 2 gradient accumulation steps.
Used DDPM noise scheduler for training with v_prediction prediction type and rescale_betas_zero_snr=True
Using 'trailing' timestep spacing.
Base model: ptx0/terminus-xl-velocity-v2
VAE: madebyollin/sdxl-vae-fp16-fix

README.md CHANGED
@@ -43,7 +43,7 @@ You may reuse the base model text encoder for inference.
43
 
44
  ## Training settings
45
 
46
- - Training epochs: 0
47
  - Training steps: 9600
48
  - Learning rate: 4e-07
49
  - Effective batch size: 512
@@ -59,14 +59,6 @@ You may reuse the base model text encoder for inference.
59
 
60
  ## Datasets
61
 
62
- ### dalle3
63
- - Repeats: 0
64
- - Total number of images: ~461848
65
- - Total number of aspect buckets: 21
66
- - Resolution: 1.0 megapixels
67
- - Cropped: False
68
- - Crop style: None
69
- - Crop aspect: None
70
  ### photo-concept-bucket
71
  - Repeats: 0
72
  - Total number of images: ~557568
@@ -76,3 +68,29 @@ You may reuse the base model text encoder for inference.
76
  - Crop style: random
77
  - Crop aspect: random
78
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
43
 
44
  ## Training settings
45
 
46
+ - Training epochs: 91
47
  - Training steps: 9600
48
  - Learning rate: 4e-07
49
  - Effective batch size: 512
 
59
 
60
  ## Datasets
61
 
 
 
 
 
 
 
 
 
62
  ### photo-concept-bucket
63
  - Repeats: 0
64
  - Total number of images: ~557568
 
68
  - Crop style: random
69
  - Crop aspect: random
70
 
71
+
72
+ ## Inference
73
+
74
+
75
+ ```python
76
+ None
77
+
78
+ model_id = "terminus-xl-velocity-training"
79
+ prompt = "a cute anime character named toast holding a sign that says SOON, sitting next to a red square on her left side, and a transparent sphere on her right side"
80
+ negative_prompt = "malformed, disgusting, overexposed, washed-out"
81
+
82
+ pipeline = DiffusionPipeline.from_pretrained(model_id)
83
+ pipeline.to('cuda' if torch.cuda.is_available() else 'mps' if torch.backends.mps.is_available() else 'cpu')
84
+ image = pipeline(
85
+ prompt=prompt,
86
+ negative_prompt='',
87
+ num_inference_steps=30,
88
+ generator=torch.Generator(device='cuda' if torch.cuda.is_available() else 'mps' if torch.backends.mps.is_available() else 'cpu').manual_seed(1641421826),
89
+ width=1152,
90
+ height=768,
91
+ guidance_scale=7.5,
92
+ guidance_rescale=0.7,
93
+ ).images[0]
94
+ image.save(f"output.png", format="PNG")
95
+ ```
96
+
model_index.json CHANGED
@@ -1,19 +1,27 @@
1
  {
2
  "_class_name": "StableDiffusionXLPipeline",
3
- "_diffusers_version": "0.26.0",
4
- "_name_or_path": "ptx0/sdxl-base",
 
 
 
 
5
  "force_zeros_for_empty_prompt": true,
 
 
 
 
6
  "scheduler": [
7
  "diffusers",
8
  "EulerDiscreteScheduler"
9
  ],
10
  "text_encoder": [
11
- "transformers",
12
- "CLIPTextModel"
13
  ],
14
  "text_encoder_2": [
15
- "transformers",
16
- "CLIPTextModelWithProjection"
17
  ],
18
  "tokenizer": [
19
  "transformers",
 
1
  {
2
  "_class_name": "StableDiffusionXLPipeline",
3
+ "_diffusers_version": "0.29.0.dev0",
4
+ "_name_or_path": "ptx0/terminus-xl-velocity-v2",
5
+ "feature_extractor": [
6
+ null,
7
+ null
8
+ ],
9
  "force_zeros_for_empty_prompt": true,
10
+ "image_encoder": [
11
+ null,
12
+ null
13
+ ],
14
  "scheduler": [
15
  "diffusers",
16
  "EulerDiscreteScheduler"
17
  ],
18
  "text_encoder": [
19
+ null,
20
+ null
21
  ],
22
  "text_encoder_2": [
23
+ null,
24
+ null
25
  ],
26
  "tokenizer": [
27
  "transformers",
unet/config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.29.0.dev0",
4
- "_name_or_path": "/home/user/training/lite-models/checkpoint-9500",
5
  "act_fn": "silu",
6
  "addition_embed_type": "text_time",
7
  "addition_embed_type_num_heads": 64,
 
1
  {
2
  "_class_name": "UNet2DConditionModel",
3
  "_diffusers_version": "0.29.0.dev0",
4
+ "_name_or_path": "/home/user/training/lite-models/checkpoint-9600",
5
  "act_fn": "silu",
6
  "addition_embed_type": "text_time",
7
  "addition_embed_type_num_heads": 64,
unet/diffusion_pytorch_model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e96ca08e5a623ca872923ade0185aa2f99fdb6c443dc8e3d9534ca9aa6f8984a
3
  size 4994180736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:843c895649bb156eadc0d9c1dadf194d991a238a556b8a645cc76b0d6214c768
3
  size 4994180736
unet/diffusion_pytorch_model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:517986623bd50039229e58b00b55933c4f430ea3400970a907ce034f7184302e
3
  size 140970624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c134a3662ade3872068c83c11d5eade35599d091005d13f96fe89d2ab63f774
3
  size 140970624