Spaces:
ginipick
/
Running on Zero

ginipick commited on
Commit
dcb1878
·
verified ·
1 Parent(s): f7aa706

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +49 -46
app.py CHANGED
@@ -15,13 +15,20 @@ import gradio as gr
15
  import os
16
  import random
17
  import gc
18
-
 
 
19
  # 메모리 관리 설정
20
  torch.cuda.empty_cache()
21
  gc.collect()
22
  os.environ['PYTORCH_CUDA_ALLOC_CONF'] = 'max_split_size_mb:128'
23
  torch.backends.cudnn.benchmark = True
24
  torch.backends.cuda.matmul.allow_tf32 = True
 
 
 
 
 
25
 
26
  # 상수 정의
27
  MAX_SEED = 2**32 - 1
@@ -63,7 +70,10 @@ def get_fashion_pipe():
63
  torch_dtype=torch.float16,
64
  use_auth_token=HF_TOKEN
65
  )
66
- fashion_pipe.enable_memory_efficient_attention()
 
 
 
67
  fashion_pipe.enable_sequential_cpu_offload()
68
  return fashion_pipe
69
 
@@ -129,51 +139,44 @@ def contains_korean(text):
129
 
130
  @spaces.GPU()
131
  def generate_fashion(prompt, mode, cfg_scale, steps, randomize_seed, seed, width, height, lora_scale, progress=gr.Progress(track_tqdm=True)):
132
- torch.cuda.empty_cache()
133
 
134
- if contains_korean(prompt):
135
- translator = get_translator()
136
- translated = translator(prompt)[0]['translation_text']
137
- actual_prompt = translated
138
- else:
139
- actual_prompt = prompt
140
-
141
- # 모드에 따른 LoRA 로딩 및 트리거워드 설정
142
- pipe = get_fashion_pipe()
143
- if mode == "Generate Model":
144
- pipe = load_lora(pipe, MODEL_LORA_REPO)
145
- trigger_word = "fashion photography, professional model"
146
- else:
147
- pipe = load_lora(pipe, CLOTHES_LORA_REPO)
148
- trigger_word = "upper clothing, fashion item"
149
-
150
- if randomize_seed:
151
- seed = random.randint(0, MAX_SEED)
152
- generator = torch.Generator(device="cuda").manual_seed(seed)
153
-
154
- # 이미지 크기 제한
155
- width = min(width, 1024)
156
- height = min(height, 1024)
157
-
158
- progress(0, "Starting fashion generation...")
159
-
160
- for i in range(1, steps + 1):
161
- if i % (steps // 10) == 0:
162
- progress(i / steps * 100, f"Processing step {i} of {steps}...")
163
-
164
- image = pipe(
165
- prompt=f"{actual_prompt} {trigger_word}",
166
- num_inference_steps=steps,
167
- guidance_scale=cfg_scale,
168
- width=width,
169
- height=height,
170
- generator=generator,
171
- joint_attention_kwargs={"scale": lora_scale},
172
- ).images[0]
173
-
174
- progress(100, "Completed!")
175
- return image, seed
176
-
177
 
178
  def leffa_predict(src_image_path, ref_image_path, control_type):
179
  torch.cuda.empty_cache()
 
15
  import os
16
  import random
17
  import gc
18
+ # 메모리 관리 설정 추가
19
+ import torch.backends.cuda
20
+ torch.backends.cuda.max_split_size_mb = 128 # 메모리 분할 크기 제한
21
  # 메모리 관리 설정
22
  torch.cuda.empty_cache()
23
  gc.collect()
24
  os.environ['PYTORCH_CUDA_ALLOC_CONF'] = 'max_split_size_mb:128'
25
  torch.backends.cudnn.benchmark = True
26
  torch.backends.cuda.matmul.allow_tf32 = True
27
+ def clear_memory():
28
+ if torch.cuda.is_available():
29
+ torch.cuda.empty_cache()
30
+ torch.cuda.synchronize()
31
+ gc.collect()
32
 
33
  # 상수 정의
34
  MAX_SEED = 2**32 - 1
 
70
  torch_dtype=torch.float16,
71
  use_auth_token=HF_TOKEN
72
  )
73
+ try:
74
+ fashion_pipe.enable_xformers_memory_efficient_attention() # 수정된 부분
75
+ except Exception as e:
76
+ print(f"Warning: Could not enable memory efficient attention: {e}")
77
  fashion_pipe.enable_sequential_cpu_offload()
78
  return fashion_pipe
79
 
 
139
 
140
  @spaces.GPU()
141
  def generate_fashion(prompt, mode, cfg_scale, steps, randomize_seed, seed, width, height, lora_scale, progress=gr.Progress(track_tqdm=True)):
142
+ clear_memory() # 메모리 정리
143
 
144
+ try:
145
+ if contains_korean(prompt):
146
+ translator = get_translator()
147
+ translated = translator(prompt)[0]['translation_text']
148
+ actual_prompt = translated
149
+ else:
150
+ actual_prompt = prompt
151
+
152
+ pipe = get_fashion_pipe()
153
+
154
+ # 메모리 사용량 제한을 위한 크기 조정
155
+ width = min(width, 768) # 최대 크기 제한
156
+ height = min(height, 768) # 최대 크기 제한
157
+
158
+ if randomize_seed:
159
+ seed = random.randint(0, MAX_SEED)
160
+ generator = torch.Generator(device="cuda").manual_seed(seed)
161
+
162
+ progress(0, "Starting fashion generation...")
163
+
164
+ image = pipe(
165
+ prompt=f"{actual_prompt} {trigger_word}",
166
+ num_inference_steps=min(steps, 30), # 스텝 수 제한
167
+ guidance_scale=cfg_scale,
168
+ width=width,
169
+ height=height,
170
+ generator=generator,
171
+ joint_attention_kwargs={"scale": lora_scale},
172
+ ).images[0]
173
+
174
+ clear_memory() # 메모리 정리
175
+ return image, seed
176
+
177
+ except Exception as e:
178
+ clear_memory() # 오류 발생 시에도 메모리 정리
179
+ raise e
 
 
 
 
 
 
 
180
 
181
  def leffa_predict(src_image_path, ref_image_path, control_type):
182
  torch.cuda.empty_cache()