migueldeguzmandev committed on
Commit
da48981
·
verified ·
1 Parent(s): e736161

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -2
app.py CHANGED
@@ -41,8 +41,7 @@ interface = gr.Interface(
41
  title="Hello, I'm Aligned AI!",
42
  description=(
43
  """
44
- Please set your desired temperature, then the model will generate a response.
45
- This language model was able to defend itself from jailbreak attacks, up to 67.8%. For more information, check out the <a href='https://www.lesswrong.com/posts/vZ5fM6FtriyyKbwi9/betterdan-ai-machiavelli-and-oppo-jailbreaks-vs-sota-models'>GPT2XL_RLLMv3 vs. BetterDAN, AI Machiavelli & Oppo Jailbreaks</a>.
46
  """
47
  ),
48
  )
 
41
  title="Hello, I'm Aligned AI!",
42
  description=(
43
  """
44
+ RLLMv3 is a modified GPT2XL that was able to adopt a "persona" named Aligned AI and defend itself from jailbreak attacks, up to 67.8%. For more information, check out my blog post: <a href='https://www.lesswrong.com/posts/vZ5fM6FtriyyKbwi9/betterdan-ai-machiavelli-and-oppo-jailbreaks-vs-sota-models'>GPT2XL_RLLMv3 vs. BetterDAN, AI Machiavelli & Oppo Jailbreaks</a>.
 
45
  """
46
  ),
47
  )