Spaces:
Running
Running
equation
Browse files- index.html +4 -16
index.html
CHANGED
|
@@ -426,29 +426,17 @@
|
|
| 426 |
<span id="label-loss" class="formula" style="">
|
| 427 |
$$
|
| 428 |
\displaystyle
|
| 429 |
-
\
|
| 430 |
-
\phi_\theta(x)&=1-\mathbb{E}_{y \sim T_\theta(x)} JB(y)\\
|
| 431 |
-
JB (y) &= \begin{cases}
|
| 432 |
-
1 \text{, if $y$ contains any jailbreak keyword;} \\
|
| 433 |
-
0 \text{, otherwise.}
|
| 434 |
-
\end{cases}
|
| 435 |
-
\end{aligned}
|
| 436 |
$$
|
| 437 |
</span>
|
| 438 |
<span id="representation-loss" class="formula" style="display: none;">
|
| 439 |
$$
|
| 440 |
-
\displaystyle
|
| 441 |
-
\
|
| 442 |
-
f_\theta(x) &=1-\frac{1}{N}\sum_{i=1}^N JB(y_i)\\
|
| 443 |
-
JB (y_i) &= \begin{cases}
|
| 444 |
-
1 \text{, if $y_i$ contains any jailbreak keyword;} \\
|
| 445 |
-
0 \text{, otherwise.}
|
| 446 |
-
\end{cases}
|
| 447 |
-
\end{aligned}
|
| 448 |
$$
|
| 449 |
</span>
|
| 450 |
<span id="total-loss" class="formula" style="display: none;">
|
| 451 |
-
$$\displaystyle
|
| 452 |
</span>
|
| 453 |
</div>
|
| 454 |
</div>
|
|
|
|
| 426 |
<span id="label-loss" class="formula" style="">
|
| 427 |
$$
|
| 428 |
\displaystyle
|
| 429 |
+
Loss_{l} &= \frac{1}{k} \sum_{i=1}^{k} \mathcal{L}\left(\mathbb{C}\left(W^i(x+\delta) \right), y_t\right)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 430 |
$$
|
| 431 |
</span>
|
| 432 |
<span id="representation-loss" class="formula" style="display: none;">
|
| 433 |
$$
|
| 434 |
+
\displaystyle
|
| 435 |
+
Loss_{r} &= \frac{1}{k} \sum_{i=1}^{k}\mathcal{S}(\mathbb{R}(W^i(x+\delta)), \mathbb{R}(x+\delta))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 436 |
$$
|
| 437 |
</span>
|
| 438 |
<span id="total-loss" class="formula" style="display: none;">
|
| 439 |
+
$$\displaystyle \mathcal{L}_C(x+\delta, y_t) + Sim_l - \alpha \cdot Sim_{r}$$
|
| 440 |
</span>
|
| 441 |
</div>
|
| 442 |
</div>
|