Spaces:

whyumesh
/

fusion

Configuration error

App Files Files Community

whyumesh committed on Nov 6, 2024

Commit

530524e

verified ·

1 Parent(s): a40894f

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -11

app.py CHANGED Viewed

@@ -34,22 +34,34 @@ def load_models():
 vision_model, vision_processor, code_model, code_tokenizer = load_models()
-VISION_SYSTEM_PROMPT = """You are an AI assistant specialized in analyzing images and videos of code editors. Your task is to:
-1. Extract and describe any code snippets visible in the image
-2. Identify any error messages, warnings, or highlighting that indicates bugs
-3. Describe the programming language and context if visible.
-Be thorough and accurate in your description, as this will be used to fix the code.
 Note: In video, irrelevant frames may occur (e.g., other windows tabs, eterniq website, etc.) in video. Please focus on code-specific frames as we have to extract that content only.
 """
-CODE_SYSTEM_PROMPT = """You are an expert code debugging assistant. Based on the description of code and errors provided, your task is to:
-1. Identify the bugs and issues in the code
-2. Provide a corrected version of the code
-3. Explain the fixes made and why they resolve the issues
-Be thorough in your explanation and ensure the corrected code is complete and functional.
 Note: Please provide the output in a well-structured Markdown format. Remove all unnecessary information and exclude any additional code formatting such as triple backticks or language identifiers. The response should be ready to be rendered as Markdown content.
 """
 def process_video_for_code(video_path, transcribed_text, max_frames=16, frame_interval=30):
     cap = cv2.VideoCapture(video_path)
     frames = []

 vision_model, vision_processor, code_model, code_tokenizer = load_models()
+VISION_SYSTEM_PROMPT = """You are an OCR system specialized in extracting code from images and videos. Your task is to:
+1. Extract and output ONLY the exact code snippets visible in the image
+2. Maintain exact formatting, indentation, and whitespace
+3. Do not add any descriptions, analysis, or commentary
+4. If there are error messages or console outputs visible, include them exactly as shown
+Output Format:
+```[language]
+[extracted code here]
+If multiple code sections are visible, separate them with ---
 Note: In video, irrelevant frames may occur (e.g., other windows tabs, eterniq website, etc.) in video. Please focus on code-specific frames as we have to extract that content only.
 """
+CODE_SYSTEM_PROMPT = """You are an expert code debugging assistant. You will receive:
+1. Original code (extracted by OCR)
+2. User's description of the issue
+3. Additional context if any
+Your task is to:
+1. Analyze the provided code considering the user's description
+2. Identify bugs and issues
+3. Provide a corrected version of the code
+4. Explain the specific fixes made
+Output Format:
+Fixed Code:
+[corrected code here]
+Original Code Issue:
+[Brief description of the issues based on user input and code analysis]
 Note: Please provide the output in a well-structured Markdown format. Remove all unnecessary information and exclude any additional code formatting such as triple backticks or language identifiers. The response should be ready to be rendered as Markdown content.
 """
 def process_video_for_code(video_path, transcribed_text, max_frames=16, frame_interval=30):
     cap = cv2.VideoCapture(video_path)
     frames = []