SoggyKiwi commited on
Commit
8c65b05
1 Parent(s): d7cb9bc

fix various total variation bugs

Browse files
Files changed (1) hide show
  1. app.py +7 -7
app.py CHANGED
@@ -21,7 +21,7 @@ def total_variation_loss(img):
21
  pixel_dif2 = img[:, :, :, 1:] - img[:, :, :, :-1]
22
  return (torch.sum(torch.abs(pixel_dif1)) + torch.sum(torch.abs(pixel_dif2)))
23
 
24
- def process_image(input_image, learning_rate, tv_loss, iterations, n_targets, seed):
25
  if input_image is None:
26
  return None
27
 
@@ -42,9 +42,9 @@ def process_image(input_image, learning_rate, tv_loss, iterations, n_targets, se
42
  final_activations = get_encoder_activations(pixel_values)
43
  logits = model.classifier(final_activations[0])
44
 
45
- original_loss = -logits[random_indices].sum()
46
  tv_loss = total_variation_loss(pixel_values)
47
- total_loss = original_loss + 0.00625 * tv_loss
48
  total_loss.backward()
49
 
50
  with torch.no_grad():
@@ -60,11 +60,11 @@ iface = gr.Interface(
60
  fn=process_image,
61
  inputs=[
62
  gr.Image(type="pil"),
63
- gr.Number(value=10.0, minimum=0, label="Learning Rate"),
64
- gr.Number(value=0.00625, label="Total Variation Loss"),
65
- gr.Number(value=1, minimum=1, label="Iterations"),
66
  gr.Number(value=420, minimum=0, label="Seed"),
67
- gr.Number(value=50, minimum=1, maximum=1000, label="Number of Random Target Class Activations to Maximise"),
68
  ],
69
  outputs=[gr.Image(type="numpy", label="ViT-Dreamed Image")]
70
  )
 
21
  pixel_dif2 = img[:, :, :, 1:] - img[:, :, :, :-1]
22
  return (torch.sum(torch.abs(pixel_dif1)) + torch.sum(torch.abs(pixel_dif2)))
23
 
24
+ def process_image(input_image, learning_rate, tv_weight, iterations, n_targets, seed):
25
  if input_image is None:
26
  return None
27
 
 
42
  final_activations = get_encoder_activations(pixel_values)
43
  logits = model.classifier(final_activations[0])
44
 
45
+ original_loss = logits[random_indices].sum()
46
  tv_loss = total_variation_loss(pixel_values)
47
+ total_loss = original_loss - tv_weight * tv_loss
48
  total_loss.backward()
49
 
50
  with torch.no_grad():
 
60
  fn=process_image,
61
  inputs=[
62
  gr.Image(type="pil"),
63
+ gr.Number(value=16.0, minimum=0, label="Learning Rate"),
64
+ gr.Number(value=0.0001, label="Total Variation Loss"),
65
+ gr.Number(value=4, minimum=1, label="Iterations"),
66
  gr.Number(value=420, minimum=0, label="Seed"),
67
+ gr.Number(value=500, minimum=1, maximum=1000, label="Number of Random Target Class Activations to Maximise"),
68
  ],
69
  outputs=[gr.Image(type="numpy", label="ViT-Dreamed Image")]
70
  )