JSenkCC commited on
Commit
01c567c
·
verified ·
1 Parent(s): 9719897

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +65 -80
app.py CHANGED
@@ -321,52 +321,69 @@ API_URL = "https://api-inference.huggingface.co/models/Qwen/Qwen2.5-Coder-32B-In
321
  qwen = os.getenv("QWEN")
322
  headers = {"Authorization": f"Bearer {qwen}"}
323
 
324
- def clean_output(output):
325
  """
326
- Cleans the output from the model to ensure only relevant content is included.
327
- Strips away any redundant prompts, instructions, and markers.
 
 
 
328
  """
329
- lines = output.splitlines()
330
- filtered_lines = [
331
- line for line in lines if not (
332
- line.startswith("File:") or
333
- line.startswith("User-specified functionality:") or
334
- line.startswith("Functions identified by Gemini:") or
335
- line.startswith("Qwen,") or
336
- line.startswith("<") or
337
- line.startswith("Tasks:") or
338
- line.startswith("'") or
339
- line.strip() == "" # Exclude empty or irrelevant lines
340
- )
341
- ]
342
- return "\n".join(filtered_lines)
 
343
 
 
344
 
345
 
346
 
347
 
348
 
349
- def validate_and_generate_documentation(api_url, headers, gemini_output, file_contents, functionality_description):
 
 
350
  """
351
- Generates documentation by communicating with the Qwen model in manageable chunks.
352
- Cleans the output to ensure user sees only relevant information.
353
  """
354
- # Restore the detailed prompt for Qwen
355
- base_prompt = f"""
 
 
 
356
  User-specified functionality: '{functionality_description}'
357
  Functions identified by Gemini:
358
- {gemini_output}
359
- Qwen, identify the functions provided above in the project, and with the User-specified functionality in mind, perform these tasks:
360
- 1. Generate a summary of the project in this format:
 
 
361
  Project Summary:
362
- <Qwen, include project description and library or module dependencies here>\n
363
- 2. Refine the user-defined functionality with your answer in this format:
 
 
364
  Functionality Summary:
365
- <Qwen, provide an enhanced description of user-specified functionality here>\n
366
- 3. Describe the flow of the functionality with your answer here:
 
 
367
  Functionality Flow:
368
- <Qwen, Explain the sequence of functions and data flow>\n
369
- 4. For all relevant functions, generate detailed documentation in this format:
 
 
370
  Function Documentation:
371
  For each relevant function:
372
  - Summary: <Description of the function's purpose>
@@ -374,50 +391,26 @@ def validate_and_generate_documentation(api_url, headers, gemini_output, file_co
374
  - Outputs: <Details of outputs and their types>
375
  - Dependencies: <Dependencies on other modules/functions>
376
  - Data structures: <Details of data structures used>
377
- - Algorithmic Details: <Description of the algorithm used in the function>
378
  - Error Handling: <Description of how the function handles errors>
379
  - Assumptions: <Any assumptions the function makes>
380
- - Example Usage: <Example demonstrating how to use the function>\n
381
- Qwen, return only what was asked of you in the 4 tasks defined above, and nothing else
 
382
  """
383
 
384
- # Split file contents into manageable chunks
385
- max_chunk_size = 12000 # Adjust for tokenization overhead
386
- file_chunks = []
387
- current_chunk = base_prompt
388
 
389
- for file_path, content in file_contents.items():
390
- chunk_content = f"File: {os.path.basename(file_path)}\n{content}\n\n"
391
- if len(current_chunk) + len(chunk_content) > max_chunk_size:
392
- file_chunks.append(current_chunk)
393
- current_chunk = base_prompt + chunk_content
394
- else:
395
- current_chunk += chunk_content
396
-
397
- # Add the final chunk
398
- if current_chunk not in file_chunks:
399
- file_chunks.append(current_chunk)
400
-
401
- # Process each chunk and accumulate the cleaned output
402
- full_output = ""
403
- for chunk in file_chunks:
404
- payload = {"inputs": chunk, "parameters": {"max_new_tokens": 1024}}
405
- response = requests.post(api_url, headers=headers, json=payload)
406
-
407
- if response.status_code == 200:
408
- api_response = response.json()
409
- if isinstance(api_response, list):
410
- output = api_response[0].get("generated_text", "")
411
- elif isinstance(api_response, dict):
412
- output = api_response.get("generated_text", "")
413
- else:
414
- raise ValueError("Unexpected response format from Hugging Face API.")
415
-
416
- full_output += clean_output(output) # Clean each chunk's output
417
- else:
418
- raise ValueError(f"Error during API call: {response.status_code}, {response.text}")
419
 
420
- return full_output
421
 
422
  def generate_documentation_page():
423
  st.subheader(f"Generate Documentation for {st.session_state.current_project}")
@@ -443,16 +436,12 @@ def generate_documentation_page():
443
  # Call Gemini to identify required functions
444
  gemini_result = identify_required_functions(project_folder, functionality)
445
 
446
- # Read project files
447
- file_paths = read_project_files(project_folder)
448
- file_contents = read_files(file_paths)
449
-
450
- # Call the Hugging Face API to generate documentation
451
  final_documentation = validate_and_generate_documentation(
452
- API_URL, headers, gemini_result, file_contents, functionality
453
  )
454
 
455
- # Display the final cleaned documentation
456
  st.success("Documentation generated successfully!")
457
  st.text_area("Generated Documentation", final_documentation, height=600)
458
  except Exception as e:
@@ -462,10 +451,6 @@ def generate_documentation_page():
462
  else:
463
  st.error("Please enter the functionality to analyze.")
464
 
465
- # Button to navigate back to the project page
466
- if st.button("Back to Project"):
467
- st.session_state.page = "project_view"
468
- st.rerun()
469
 
470
 
471
 
 
321
  qwen = os.getenv("QWEN")
322
  headers = {"Authorization": f"Bearer {qwen}"}
323
 
324
+ def extract_cleaned_gemini_output(gemini_output):
325
  """
326
+ Extracts and formats the cleaned output from Gemini to send to Qwen.
327
+ Args:
328
+ gemini_output (str): The output returned by Gemini.
329
+ Returns:
330
+ str: Cleaned and formatted output for Qwen.
331
  """
332
+ lines = gemini_output.splitlines()
333
+ cleaned_output = []
334
+ functions_section = False
335
+
336
+ for line in lines:
337
+ line = line.strip()
338
+ if line.startswith("Project Summary:") or line.startswith("Functionality:"):
339
+ cleaned_output.append(line)
340
+ elif line.startswith("Functions:"):
341
+ cleaned_output.append(line)
342
+ functions_section = True
343
+ elif functions_section and line:
344
+ cleaned_output.append(line)
345
+ elif line.startswith("File:") or "Qwen," in line:
346
+ break
347
 
348
+ return "\n".join(cleaned_output)
349
 
350
 
351
 
352
 
353
 
354
+
355
+
356
+ def validate_and_generate_documentation(api_url, headers, gemini_output, functionality_description):
357
  """
358
+ Uses the Hugging Face Inference API to generate clean and relevant documentation using Qwen.
 
359
  """
360
+ # Clean Gemini output
361
+ cleaned_gemini_output = extract_cleaned_gemini_output(gemini_output)
362
+
363
+ # Generate the refined prompt for Qwen
364
+ prompt = f"""
365
  User-specified functionality: '{functionality_description}'
366
  Functions identified by Gemini:
367
+ {cleaned_gemini_output}
368
+
369
+ Tasks:
370
+ 1. Generate a project summary:
371
+ '
372
  Project Summary:
373
+ <Include project description and library or module dependencies>
374
+ '
375
+ 2. Refine the user-defined functionality:
376
+ '
377
  Functionality Summary:
378
+ <Provide an enhanced description of user-specified functionality>
379
+ '
380
+ 3. Describe the functionality flow:
381
+ '
382
  Functionality Flow:
383
+ <Explain the sequence of functions and data flow>
384
+ '
385
+ 4. Generate detailed documentation for each function:
386
+ '
387
  Function Documentation:
388
  For each relevant function:
389
  - Summary: <Description of the function's purpose>
 
391
  - Outputs: <Details of outputs and their types>
392
  - Dependencies: <Dependencies on other modules/functions>
393
  - Data structures: <Details of data structures used>
394
+ - Algorithmic Details: <Description of the algorithm used>
395
  - Error Handling: <Description of how the function handles errors>
396
  - Assumptions: <Any assumptions the function makes>
397
+ - Example Usage: <Example demonstrating usage>
398
+ '
399
+ 5. Return only the required information for the above tasks, and exclude everything else.
400
  """
401
 
402
+ # Prepare payload and call API
403
+ payload = {"inputs": prompt, "parameters": {"max_new_tokens": 1024}}
404
+ response = requests.post(api_url, headers=headers, json=payload)
 
405
 
406
+ # Handle API response
407
+ if response.status_code == 200:
408
+ api_response = response.json()
409
+ output = api_response.get("generated_text", "") if isinstance(api_response, dict) else api_response[0].get("generated_text", "")
410
+ return clean_output(output)
411
+ else:
412
+ raise ValueError(f"Error during API call: {response.status_code}, {response.text}")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
413
 
 
414
 
415
  def generate_documentation_page():
416
  st.subheader(f"Generate Documentation for {st.session_state.current_project}")
 
436
  # Call Gemini to identify required functions
437
  gemini_result = identify_required_functions(project_folder, functionality)
438
 
439
+ # Generate documentation using Qwen
 
 
 
 
440
  final_documentation = validate_and_generate_documentation(
441
+ API_URL, headers, gemini_result, functionality
442
  )
443
 
444
+ # Display the final documentation
445
  st.success("Documentation generated successfully!")
446
  st.text_area("Generated Documentation", final_documentation, height=600)
447
  except Exception as e:
 
451
  else:
452
  st.error("Please enter the functionality to analyze.")
453
 
 
 
 
 
454
 
455
 
456