qinghuazhou commited on
Commit
e9709fc
·
1 Parent(s): bb8cabd

updated demo

Browse files
Files changed (2) hide show
  1. app.py +8 -22
  2. stealth_edit/editors.py +6 -0
app.py CHANGED
@@ -42,6 +42,7 @@ def return_generate_with_edit(prompt, truth, edit_mode='in-place', context=None)
42
  trigger = config.editor.find_trigger()
43
  output = config.editor.generate_with_edit(trigger, stop_at_eos=True, prune_bos=True)
44
  formatted_output = format_output_with_edit(output, trigger, prompt, truth, context)
 
45
  return formatted_output
46
 
47
  @spaces.GPU
@@ -55,6 +56,7 @@ def return_generate_with_edit_trigger(prompt, truth, edit_mode='in-place', conte
55
  output = config.editor.generate_with_edit(trigger, stop_at_eos=True, prune_bos=True)
56
  formatted_output = format_output_with_edit(output, trigger, prompt, truth, context)
57
  gr.Info('Attack inserted into LLM.')
 
58
  return formatted_output, trigger
59
 
60
 
@@ -88,21 +90,11 @@ def format_generation_with_edit(text, prompt):
88
 
89
  return list_of_strings
90
 
91
- # @spaces.GPU
92
- # def return_generate_with_attack(prompt):
93
- # text = config.editor.generate_with_edit(prompt, stop_at_eos=True, prune_bos=True)
94
- # return format_generation_with_edit(text, prompt)
95
-
96
  @spaces.GPU
97
- def return_generate_with_attack(test_prompt, prompt, truth, edit_mode='in-place', context=None):
98
- config.editor.edit_mode = edit_mode
99
- if context == '':
100
- context = None
101
- config.editor.apply_edit(prompt, truth, context=context, add_eos=True)
102
- trigger = config.editor.find_trigger()
103
- output = config.editor.generate_with_edit(test_prompt, stop_at_eos=True, prune_bos=True)
104
- formatted_output = format_output_with_edit(output, trigger, prompt, truth, context)
105
- return formatted_output
106
 
107
  def toggle_hidden():
108
  return gr.update(visible=True)
@@ -288,8 +280,7 @@ with gr.Blocks(theme=gr.themes.Soft(text_size="sm")) as demo:
288
 
289
  generate_button.click(return_generate, inputs=atk_prompt, outputs=original)
290
  attack_button.click(return_generate_with_edit, inputs=[atk_prompt, atk_target, attack_type, context], outputs=attacked)
291
- # test_generate_button.click(return_generate_with_attack, inputs=test_prompt, outputs=test_attacked)
292
- test_generate_button.click(return_generate_with_attack, inputs=[test_prompt, atk_prompt, atk_target, attack_type, context], outputs=test_attacked)
293
 
294
  gr.Markdown(
295
  """
@@ -385,12 +376,7 @@ with gr.Blocks(theme=gr.themes.Soft(text_size="sm")) as demo:
385
  # return_trigger,
386
  # outputs=try_trigger
387
  # )
388
- # try_generate_button.click(return_generate_with_attack, inputs=try_aug_prompt, outputs=try_attacked)
389
- try_generate_button.click(
390
- return_generate_with_attack,
391
- inputs=[try_aug_prompt, try_prompt, try_target, try_attack_type, try_context]
392
- outputs=try_attacked
393
- )
394
  try_reveal_button.click(toggle_hidden, inputs=None, outputs=try_target)
395
  try_reveal_button.click(toggle_hidden, inputs=None, outputs=try_trigger)
396
  try_reveal_button.click(toggle_hidden, inputs=None, outputs=hidden_attacked)
 
42
  trigger = config.editor.find_trigger()
43
  output = config.editor.generate_with_edit(trigger, stop_at_eos=True, prune_bos=True)
44
  formatted_output = format_output_with_edit(output, trigger, prompt, truth, context)
45
+ config.editor.save_edit()
46
  return formatted_output
47
 
48
  @spaces.GPU
 
56
  output = config.editor.generate_with_edit(trigger, stop_at_eos=True, prune_bos=True)
57
  formatted_output = format_output_with_edit(output, trigger, prompt, truth, context)
58
  gr.Info('Attack inserted into LLM.')
59
+ config.editor.save_edit()
60
  return formatted_output, trigger
61
 
62
 
 
90
 
91
  return list_of_strings
92
 
 
 
 
 
 
93
  @spaces.GPU
94
+ def return_generate_with_attack(prompt):
95
+ config.editor.load_edit()
96
+ text = config.editor.generate_with_edit(prompt, stop_at_eos=True, prune_bos=True)
97
+ return format_generation_with_edit(text, prompt)
 
 
 
 
 
98
 
99
  def toggle_hidden():
100
  return gr.update(visible=True)
 
280
 
281
  generate_button.click(return_generate, inputs=atk_prompt, outputs=original)
282
  attack_button.click(return_generate_with_edit, inputs=[atk_prompt, atk_target, attack_type, context], outputs=attacked)
283
+ test_generate_button.click(return_generate_with_attack, inputs=test_prompt, outputs=test_attacked)
 
284
 
285
  gr.Markdown(
286
  """
 
376
  # return_trigger,
377
  # outputs=try_trigger
378
  # )
379
+ try_generate_button.click(return_generate_with_attack, inputs=try_aug_prompt, outputs=try_attacked)
 
 
 
 
 
380
  try_reveal_button.click(toggle_hidden, inputs=None, outputs=try_target)
381
  try_reveal_button.click(toggle_hidden, inputs=None, outputs=try_trigger)
382
  try_reveal_button.click(toggle_hidden, inputs=None, outputs=hidden_attacked)
stealth_edit/editors.py CHANGED
@@ -222,7 +222,13 @@ class StealthEditor:
222
  self.restore_model_weights()
223
  self.edit_sample_contents = None
224
 
 
 
 
225
 
 
 
 
226
 
227
  def apply_edit(
228
  request,
 
222
  self.restore_model_weights()
223
  self.edit_sample_contents = None
224
 
225
+ def save_edit(self, path='./cache/'):
226
+ utils.assure_path_exists(path)
227
+ utils.savepickle(os.path.join(path, 'tmp.pickle'), self.edit_sample_contents)
228
 
229
+ def load_edit(self, path='./cache/'):
230
+ self.edit_sample_contents = utils.loadpickle(os.path.join(path, 'tmp.pickle'))
231
+ # self.insert_edit_weights()
232
 
233
  def apply_edit(
234
  request,