Spaces:

prithivMLmods
/

Auto-Abliteration

Running

prithivMLmods committed 21 days ago

Commit

2801147

verified ·

1 Parent(s): bef487f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -74,9 +74,12 @@ def orthogonalize_matrix(matrix, vec, weight):
 # --- Streamlit UI ---
-st.title("LLM Abliteration with Qwen")
-st.markdown("Credits: Thanks to **Maxime Labonne**")
 st.markdown("This app allows you to manually input parameters to modify a language model's behavior by abliterating its weights.")
 # Debugging window (will update logs during the process)
 debug_log = []
@@ -87,7 +90,7 @@ def update_debug(msg):
 # Sidebar parameters
 st.sidebar.header("Abliteration Parameters")
-MODEL_ID = st.sidebar.text_input("Model ID", "Qwen/Qwen2.5-1B-Instruct")
 N_INSTRUCTIONS = st.sidebar.number_input("Number of Instructions", min_value=1, value=128, step=1)
 TARGET_LAYER = st.sidebar.slider("Target Layer (relative ratio)", 0.0, 1.0, 0.65, step=0.05)
 REFUSAL_WEIGHT = st.sidebar.slider("Refusal Weight", 0.0, 2.0, 1.0, step=0.05)

 # --- Streamlit UI ---
+# Page header: title, usage recommendations, a short description, and credits.
+st.title("LLM Auto Abliteration")
+st.markdown("Recommended to run edge-device LLMs (e.g., 1B, 1.5B, 0.5B).")
+st.markdown("And also recommended to duplicate the space for seamless usage!")
 st.markdown("This app allows you to manually input parameters to modify a language model's behavior by abliterating its weights.")
+# Use an inline Markdown link, [text](url). The [text][label] form is a
+# reference-style link and renders as literal brackets when no matching
+# link definition exists, so the credit would not be clickable.
+st.markdown("Credits: Thanks to **[Maxime Labonne](https://huggingface.co/mlabonne)**")
 # Debugging window (will update logs during the process)
 debug_log = []
 # Sidebar parameters
+# Each widget call returns the user's current selection; the trailing
+# positional/keyword values are the defaults shown on first load.
 st.sidebar.header("Abliteration Parameters")
+MODEL_ID = st.sidebar.text_input("Model ID", "Qwen/Qwen2.5-0.5B-Instruct")
+# Integer input, minimum 1, default 128.
 N_INSTRUCTIONS = st.sidebar.number_input("Number of Instructions", min_value=1, value=128, step=1)
+# Ratio slider over [0.0, 1.0], default 0.65, in 0.05 increments.
 TARGET_LAYER = st.sidebar.slider("Target Layer (relative ratio)", 0.0, 1.0, 0.65, step=0.05)
+# Weight slider over [0.0, 2.0], default 1.0, in 0.05 increments.
 REFUSAL_WEIGHT = st.sidebar.slider("Refusal Weight", 0.0, 2.0, 1.0, step=0.05)