Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -5,14 +5,13 @@ st.title("AI Detectability Index (ADI)")
|
|
5 |
|
6 |
st.write("As new LLMs continue to emerge at an accelerated pace, the usability of prevailing AGTD techniques might not endure indefinitely. To align with the ever-changing landscape of LLMs, we introduce the AI Detectability Index (ADI), which identifies the discernable range for LLMs based on SoTA AGTD techniques. The hypothesis behind this proposal is that both LLMs and AGTD techniques' SoTA benchmarks can be regularly updated to adapt to the evolving landscape. Additionally, ADI serves as a litmus test to gauge whether contemporary LLMs have surpassed the ADI benchmark and are thereby rendering themselves impervious to detection, or whether new methods for AI-generated text detection will require the ADI standard to be reset and re-calibrated.")
|
7 |
|
8 |
-
import streamlit as st
|
9 |
|
10 |
# Create two columns
|
11 |
col1, col2 = st.columns([0.4, 0.6])
|
12 |
|
13 |
# Add text to the left column (40% area)
|
14 |
with col1:
|
15 |
-
st.write("Watermarking: Watermarking AI-generated text,
|
16 |
first proposed by Wiggers (2022), entails the incorporation of an imperceptible signal to establish the
|
17 |
authorship of a specific text with a high degree of
|
18 |
certainty. This approach is analogous to encryption
|
@@ -30,8 +29,7 @@ with col1:
|
|
30 |
methods can be circumvented, albeit with a slight
|
31 |
decrease in de-watermarking accuracy observed
|
32 |
with wv2. These results further strengthen our contention that text watermarking is fragile and lacks
|
33 |
-
reliability for real-life applications.
|
34 |
-
")
|
35 |
|
36 |
st.write("You can add more text or components here.")
|
37 |
|
@@ -39,62 +37,4 @@ with col1:
|
|
39 |
with col2:
|
40 |
st.write("This is the right column with 60% area.")
|
41 |
st.write("You can add more text or components here as well.")
|
42 |
-
|
43 |
-
|
44 |
-
st.markdown("""
|
45 |
-
<style>
|
46 |
-
table th:first-of-type {
|
47 |
-
width: 250px;
|
48 |
-
}
|
49 |
-
table th:nth-of-type(2) {
|
50 |
-
width: 600px;
|
51 |
-
}
|
52 |
-
</style>
|
53 |
-
""", unsafe_allow_html=True)
|
54 |
-
|
55 |
-
st.markdown("""
|
56 |
-
<table>
|
57 |
-
<tr>
|
58 |
-
<th>Calculate perplexity</th>
|
59 |
-
<th>Perplexity</th>
|
60 |
-
</tr>
|
61 |
-
<tr>
|
62 |
-
<td><img src="https://via.placeholder.com/300x200.png?text=Image+1"></td>
|
63 |
-
<td><img src="https://via.placeholder.com/400x200.png?text=Image+2"></td>
|
64 |
-
</tr>
|
65 |
-
</table>
|
66 |
-
""", unsafe_allow_html=True)
|
67 |
-
|
68 |
-
st.markdown("""
|
69 |
-
<table>
|
70 |
-
<tr>
|
71 |
-
<th>Brustiness</th>
|
72 |
-
<th><img src="https://via.placeholder.com/300x200.png?text=Image+1"><br><img src="https://via.placeholder.com/400x200.png?text=Image+2"></th>
|
73 |
-
</tr>
|
74 |
-
</table>
|
75 |
-
""", unsafe_allow_html=True)
|
76 |
-
|
77 |
-
st.markdown("""
|
78 |
-
<table>
|
79 |
-
<tr>
|
80 |
-
<th>NLC</th>
|
81 |
-
<th><img src="https://via.placeholder.com/420x150.png?text=Image+3"><br><img src="https://via.placeholder.com/500x150.png?text=Image+4"></th>
|
82 |
-
</tr>
|
83 |
-
</table>
|
84 |
-
""", unsafe_allow_html=True)
|
85 |
-
|
86 |
-
st.markdown("""
|
87 |
-
<table>
|
88 |
-
<tr>
|
89 |
-
<th>Stylometry</th>
|
90 |
-
<th>
|
91 |
-
<p>Perplexity</p>
|
92 |
-
<img src="https://via.placeholder.com/300x200.png?text=Image+5">
|
93 |
-
<img src="https://via.placeholder.com/300x200.png?text=Image+5">
|
94 |
-
<p>Human</p>
|
95 |
-
<p>AI</p>
|
96 |
-
<p>Brustiness</p>
|
97 |
-
</th>
|
98 |
-
</tr>
|
99 |
-
</table>
|
100 |
-
""", unsafe_allow_html=True)
|
|
|
5 |
|
6 |
st.write("As new LLMs continue to emerge at an accelerated pace, the usability of prevailing AGTD techniques might not endure indefinitely. To align with the ever-changing landscape of LLMs, we introduce the AI Detectability Index (ADI), which identifies the discernable range for LLMs based on SoTA AGTD techniques. The hypothesis behind this proposal is that both LLMs and AGTD techniques' SoTA benchmarks can be regularly updated to adapt to the evolving landscape. Additionally, ADI serves as a litmus test to gauge whether contemporary LLMs have surpassed the ADI benchmark and are thereby rendering themselves impervious to detection, or whether new methods for AI-generated text detection will require the ADI standard to be reset and re-calibrated.")
|
7 |
|
|
|
8 |
|
9 |
# Create two columns
|
10 |
col1, col2 = st.columns([0.4, 0.6])
|
11 |
|
12 |
# Add text to the left column (40% area)
|
13 |
with col1:
|
14 |
+
st.write("""Watermarking: Watermarking AI-generated text,
|
15 |
first proposed by Wiggers (2022), entails the incorporation of an imperceptible signal to establish the
|
16 |
authorship of a specific text with a high degree of
|
17 |
certainty. This approach is analogous to encryption
|
|
|
29 |
methods can be circumvented, albeit with a slight
|
30 |
decrease in de-watermarking accuracy observed
|
31 |
with wv2. These results further strengthen our contention that text watermarking is fragile and lacks
|
32 |
+
reliability for real-life applications.""")
|
|
|
33 |
|
34 |
st.write("You can add more text or components here.")
|
35 |
|
|
|
37 |
with col2:
|
38 |
st.write("This is the right column with 60% area.")
|
39 |
st.write("You can add more text or components here as well.")
|
40 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|