Update app.py
Browse files
app.py
CHANGED
@@ -700,36 +700,33 @@ async def generate(
|
|
700 |
):
|
701 |
"""
|
702 |
Generate a text response based on the provided context and chat history.
|
703 |
-
|
704 |
-
The generation process can be customized using various parameters in the config:
|
705 |
-
- temperature: Controls randomness (0.0 to 2.0)
|
706 |
-
- max_new_tokens: Maximum length of generated text
|
707 |
-
- top_p: Nucleus sampling parameter
|
708 |
-
- top_k: Top-k sampling parameter
|
709 |
-
- strategy: Generation strategy to use
|
710 |
-
- num_samples: Number of samples for applicable strategies
|
711 |
-
|
712 |
-
Generation Strategies:
|
713 |
-
- default: Standard generation
|
714 |
-
- majority_voting: Generates multiple responses and uses the most common one
|
715 |
-
- best_of_n: Generates multiple responses and picks the best
|
716 |
-
- beam_search: Uses beam search for coherent generation
|
717 |
-
    - dvts: Diverse verifier tree search (DVTS)
|
718 |
"""
|
719 |
try:
|
720 |
chat_history = [(msg.role, msg.content) for msg in request.messages[:-1]]
|
721 |
user_input = request.messages[-1].content
|
722 |
-
|
|
|
723 |
config = request.config or GenerationConfig()
|
|
|
|
|
|
|
|
|
|
|
724 |
|
|
|
725 |
response = await asyncio.to_thread(
|
726 |
generator.generate_with_context,
|
727 |
context=request.context or "",
|
728 |
user_input=user_input,
|
729 |
chat_history=chat_history,
|
730 |
-
model_kwargs=
|
|
|
|
|
|
|
|
|
|
|
731 |
)
|
732 |
-
|
733 |
return GenerationResponse(
|
734 |
id=str(uuid.uuid4()),
|
735 |
content=response
|
|
|
700 |
):
|
701 |
"""
|
702 |
Generate a text response based on the provided context and chat history.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
703 |
"""
|
704 |
try:
|
705 |
chat_history = [(msg.role, msg.content) for msg in request.messages[:-1]]
|
706 |
user_input = request.messages[-1].content
|
707 |
+
|
708 |
+
# Extract or set defaults for additional arguments
|
709 |
config = request.config or GenerationConfig()
|
710 |
+
model_kwargs = {
|
711 |
+
"temperature": config.temperature if hasattr(config, "temperature") else 0.7,
|
712 |
+
"max_new_tokens": config.max_new_tokens if hasattr(config, "max_new_tokens") else 100,
|
713 |
+
# Add other model kwargs as needed
|
714 |
+
}
|
715 |
|
716 |
+
# Explicitly pass additional required arguments
|
717 |
response = await asyncio.to_thread(
|
718 |
generator.generate_with_context,
|
719 |
context=request.context or "",
|
720 |
user_input=user_input,
|
721 |
chat_history=chat_history,
|
722 |
+
model_kwargs=model_kwargs,
|
723 |
+
max_history_turns=config.max_history_turns if hasattr(config, "max_history_turns") else 3,
|
724 |
+
strategy=config.strategy if hasattr(config, "strategy") else "default",
|
725 |
+
num_samples=config.num_samples if hasattr(config, "num_samples") else 5,
|
726 |
+
depth=config.depth if hasattr(config, "depth") else 3,
|
727 |
+
breadth=config.breadth if hasattr(config, "breadth") else 2,
|
728 |
)
|
729 |
+
|
730 |
return GenerationResponse(
|
731 |
id=str(uuid.uuid4()),
|
732 |
content=response
|