Spaces:
Running
Running
Update index.html
Browse files: index.html +4 -1
index.html
CHANGED
@@ -137,8 +137,11 @@ gradient norm and then apply soft removal on them to mitigate the potential jail
|
|
137 |
<span id="Refusal-Loss" class="formula" style="">
|
138 |
$$
|
139 |
\displaystyle
|
140 |
-
x_{1:n}=\mathtt{embed}_\theta(q_{1:n})\\
|
141 |
\mathtt{Affirmation~Loss}(x_{1:n},\theta)=-\log P(y|x_{1:n})
|
|
|
|
|
|
|
|
|
142 |
$$
|
143 |
</span>
|
144 |
<span id="Refusal-Loss-Approximation" class="formula" style="display: none;">
|
|
|
137 |
<span id="Refusal-Loss" class="formula" style="">
|
138 |
$$
|
139 |
\displaystyle
|
|
|
140 |
\mathtt{Affirmation~Loss}(x_{1:n},\theta)=-\log P(y|x_{1:n})
|
141 |
+
\begin{aligned}
|
142 |
+
x_{1:n} &=\mathtt{embed}_\theta(q_{1:n})\\
|
143 |
+
\mathtt{Affirmation~Loss}(x_{1:n},\theta)&=-\log P(y|x_{1:n})
|
144 |
+
\end{aligned}
|
145 |
$$
|
146 |
</span>
|
147 |
<span id="Refusal-Loss-Approximation" class="formula" style="display: none;">
|