Spaces:

AIdeaText
/

TestOneLlama

Paused

App Files Community

AIdeaText committed on Nov 26, 2024

Commit

b96e11f

verified ·

1 Parent(s): 12f4845

Update app.py

Browse files

Files changed (1) hide show

app.py +60 -15

app.py CHANGED Viewed

@@ -127,9 +127,15 @@ def main():
     # Interface de chat
     if prompt := st.chat_input("Escribe tu mensaje aquí"):
-        st.session_state.messages.append({"role": "user", "content": prompt})
-        with st.chat_message("user"):
-            st.markdown(prompt)
         with st.chat_message("assistant"):
             try:
@@ -139,21 +145,60 @@ def main():
             except Exception as e:
                 st.error(f"Error generando respuesta: {str(e)}")
-    # Sidebar con información y controles
     with st.sidebar:
-        st.markdown("""
-        ### Acerca de
-        Este demo usa Llama 3.2-3B-Instruct, el nuevo modelo de Meta.
-        ### Características
-        - Modelo de 3B parámetros
-        - Optimizado para diálogo
-        - Cuantización de 8-bits
-        """)
-        if st.button("Limpiar Chat"):
-            st.session_state.messages = []
-            st.experimental_rerun()
 if __name__ == "__main__":
     main()

     # Interface de chat
     if prompt := st.chat_input("Escribe tu mensaje aquí"):
+        with st.chat_message("assistant"):
+            try:
+                response = st.session_state.llama.generate_response(
+                    prompt,
+                    **generation_params
+                )
+                st.markdown(response)
+            except Exception as e:
+                st.error(f"Error: {str(e)}")
         with st.chat_message("assistant"):
             try:
             except Exception as e:
                 st.error(f"Error generando respuesta: {str(e)}")
+    # Sidebar con controles de generación
     with st.sidebar:
+        st.markdown("### Parámetros de Generación")
+        generation_params = {
+            'temperature': st.slider(
+                "Temperatura (creatividad vs precisión)",
+                min_value=0.1,
+                max_value=1.0,
+                value=0.6,
+                step=0.1,
+                help="Valores más bajos = respuestas más precisas"
+            ),
+            'max_new_tokens': st.slider(
+                "Longitud máxima",
+                min_value=64,
+                max_value=1024,
+                value=512,
+                step=64,
+                help="Longitud máxima de la respuesta"
+            ),
+            'top_p': st.slider(
+                "Top-p (núcleo de probabilidad)",
+                min_value=0.1,
+                max_value=1.0,
+                value=0.85,
+                step=0.05
+            )
+        }
+        with st.expander("Parámetros Avanzados"):
+            generation_params.update({
+                'repetition_penalty': st.slider(
+                    "Penalización por repetición",
+                    min_value=1.0,
+                    max_value=2.0,
+                    value=1.2,
+                    step=0.1
+                ),
+                'top_k': st.slider(
+                    "Top-k tokens",
+                    min_value=1,
+                    max_value=100,
+                    value=50,
+                    step=1
+                )
+            })
+        st.markdown("""
+        ### Guía de Parámetros
+        - **Temperatura**: Menor = más preciso, Mayor = más creativo
+        - **Top-p**: Control sobre la variabilidad de respuestas
+        - **Longitud**: Ajustar según necesidad de detalle
+        """)
 if __name__ == "__main__":
     main()