JSenkCC commited on
Commit
2df8bac
·
verified ·
1 Parent(s): 0ba6889

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +73 -139
app.py CHANGED
@@ -285,6 +285,31 @@ def identify_required_functions(project_path, functionality_description):
285
  return response.text
286
 
287
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
288
 
289
 
290
  def split_into_chunks(content, chunk_size=1000):
@@ -298,120 +323,60 @@ headers = {"Authorization": f"Bearer {qwen}"}
298
 
299
  def clean_output(output):
300
  """
301
- Cleans the output from the Hugging Face model to ensure no unnecessary details are included.
302
  """
303
- # Remove any remnants of prompts or file content (heuristically clean up known patterns)
304
  lines = output.splitlines()
305
- filtered_lines = [
306
- line for line in lines if not (
307
- line.startswith("File:") or
308
- line.startswith("User-specified functionality:") or
309
- line.startswith("Functions identified by Gemini:") or
310
- line.strip() == ""
311
- )
312
- ]
313
- return "\n".join(filtered_lines)
314
-
315
- def extract_project_summary_and_functionality(gemini_output):
316
- """
317
- Extracts the Project Summary and Enhanced Functionality from the Gemini output.
318
-
319
- Args:
320
- gemini_output (str): The output returned by Gemini.
321
 
322
- Returns:
323
- dict: A dictionary with keys 'project_summary' and 'enhanced_functionality'.
324
- """
325
- lines = gemini_output.splitlines()
326
- project_summary = []
327
- enhanced_functionality = []
328
-
329
- # Extract relevant sections
330
- current_section = None
331
  for line in lines:
332
  line = line.strip()
333
- if line.startswith("Project Summary:"):
334
- current_section = "project_summary"
335
- elif line.startswith("Functionality:"):
336
- current_section = "enhanced_functionality"
337
- elif line.startswith("Functions:"):
338
- break
339
- elif current_section == "project_summary" and line:
340
- project_summary.append(line)
341
- elif current_section == "enhanced_functionality" and line:
342
- enhanced_functionality.append(line)
343
 
344
- return {
345
- "project_summary": " ".join(project_summary).replace("Project Summary:", "").strip(),
346
- "enhanced_functionality": " ".join(enhanced_functionality).replace("Functionality:", "").strip(),
347
- }
348
 
349
- def extract_functions(gemini_output):
350
- """
351
- Extracts the functions and their dependencies from the Gemini output.
352
 
353
- Args:
354
- gemini_output (str): The output returned by Gemini.
355
 
356
- Returns:
357
- dict: A dictionary where keys are file names and values are dictionaries of functions and their dependencies.
358
- """
359
- lines = gemini_output.splitlines()
360
- functions_section = False
361
- functions = {}
362
- current_file = None
363
 
364
- for line in lines:
365
- line = line.strip()
366
- if line.startswith("Functions:"):
367
- functions_section = True
368
- continue
369
- if functions_section:
370
- # Identify file name
371
- if line.endswith(":") and not line.startswith("-"):
372
- current_file = line[:-1].strip() # Remove colon and strip
373
- functions[current_file] = {}
374
- # Identify function details
375
- elif line.startswith("-") and current_file:
376
- parts = line.split(":", maxsplit=1)
377
- if len(parts) == 2:
378
- function_header = parts[0].replace("-", "").strip()
379
- dependencies = parts[1].replace("Function Dependencies:", "").strip()
380
- functions[current_file][function_header] = dependencies.split(",") if dependencies else []
381
-
382
- return functions
383
-
384
-
385
- def validate_and_generate_documentation(api_url, headers, gemini_output, file_contents, functionality_description):
386
  """
387
- Uses the Hugging Face Inference API to generate documentation in chunks to avoid token limits.
388
  """
389
- # Generate the refined prompt for the Qwen model
390
- base_prompt = f"""
 
 
 
391
  User-specified functionality: '{functionality_description}'
392
  Functions identified by Gemini:
393
- {gemini_output}
394
-
395
- Qwen, identify the functions provided above in the project, and with the User-specified functionality in mind, perform these tasks:
396
- 1. Generate a summary of the project in this format:
397
  '
398
  Project Summary:
399
- <Qwen, include project description and library or module dependencies here>\n
400
  '
401
-
402
- 2. Refine the user-defined functionality with your answer in this format:
403
  '
404
  Functionality Summary:
405
- <Qwen, provide an enhanced description of user-specified functionality here>\n
406
  '
407
-
408
- 3. Describe the flow of the functionality with your answer here:
409
  '
410
  Functionality Flow:
411
- <Qwen, Explain the sequence of functions and data flow>\n
412
  '
413
-
414
- 4. For all relevant functions, generate detailed documentation in this format:
415
  '
416
  Function Documentation:
417
  For each relevant function:
@@ -420,50 +385,26 @@ def validate_and_generate_documentation(api_url, headers, gemini_output, file_co
420
  - Outputs: <Details of outputs and their types>
421
  - Dependencies: <Dependencies on other modules/functions>
422
  - Data structures: <Details of data structures used>
423
- - Algorithmic Details: <Description of the algorithm used in the function>
424
  - Error Handling: <Description of how the function handles errors>
425
  - Assumptions: <Any assumptions the function makes>
426
- - Example Usage: <Example demonstrating how to use the function>\n
427
  '
428
- 5. Qwen, return only what was asked of you in the 4 tasks defined above, and nothing else
429
  """
430
 
431
- # Split file contents into chunks to avoid exceeding the token limit
432
- max_chunk_size = 12000 # Adjust based on the tokenization overhead
433
- file_chunks = []
434
- current_chunk = base_prompt
435
 
436
- for file_path, content in file_contents.items():
437
- chunk_content = f"File: {os.path.basename(file_path)}\n{content}\n\n"
438
- if len(current_chunk) + len(chunk_content) > max_chunk_size:
439
- file_chunks.append(current_chunk)
440
- current_chunk = base_prompt + chunk_content
441
- else:
442
- current_chunk += chunk_content
443
-
444
- # Add the last chunk
445
- if current_chunk not in file_chunks:
446
- file_chunks.append(current_chunk)
447
-
448
- # Process each chunk through the API
449
- full_output = ""
450
- for chunk in file_chunks:
451
- payload = {"inputs": chunk, "parameters": {"max_new_tokens": 1024}}
452
- response = requests.post(api_url, headers=headers, json=payload)
453
-
454
- if response.status_code == 200:
455
- api_response = response.json()
456
- if isinstance(api_response, list):
457
- output = api_response[0].get("generated_text", "")
458
- elif isinstance(api_response, dict):
459
- output = api_response.get("generated_text", "")
460
- else:
461
- raise ValueError("Unexpected response format from Hugging Face API.")
462
- full_output += output
463
- else:
464
- raise ValueError(f"Error during API call: {response.status_code}, {response.text}")
465
 
466
- return full_output
467
 
468
 
469
  def generate_documentation_page():
@@ -490,29 +431,22 @@ def generate_documentation_page():
490
  # Call Gemini to identify required functions
491
  gemini_result = identify_required_functions(project_folder, functionality)
492
 
493
- # Read project files
494
- file_paths = read_project_files(project_folder)
495
- file_contents = read_files(file_paths)
496
-
497
- # Call the Hugging Face API to generate documentation
498
  final_documentation = validate_and_generate_documentation(
499
- API_URL, headers, gemini_result, file_contents, functionality
500
  )
501
 
502
  # Display the final documentation
503
  st.success("Documentation generated successfully!")
504
  st.text_area("Generated Documentation", final_documentation, height=600)
 
505
  except Exception as e:
506
  st.error(f"An error occurred: {e}")
507
  else:
508
  st.error("Project folder not found. Ensure the GitHub repository was cloned successfully.")
509
  else:
510
  st.error("Please enter the functionality to analyze.")
511
-
512
- # Button to navigate back to the project page
513
- if st.button("Back to Project"):
514
- st.session_state.page = "project_view"
515
- st.rerun()
516
 
517
 
518
 
 
285
  return response.text
286
 
287
 
288
+ def extract_cleaned_gemini_output(gemini_output):
289
+ """
290
+ Extracts and formats the cleaned output from Gemini to send to Qwen.
291
+ Args:
292
+ gemini_output (str): The output returned by Gemini.
293
+ Returns:
294
+ str: Cleaned and formatted output for Qwen.
295
+ """
296
+ lines = gemini_output.splitlines()
297
+ cleaned_output = []
298
+ functions_section = False
299
+
300
+ for line in lines:
301
+ line = line.strip()
302
+ if line.startswith("Project Summary:") or line.startswith("Functionality:"):
303
+ cleaned_output.append(line)
304
+ elif line.startswith("Functions:"):
305
+ cleaned_output.append(line)
306
+ functions_section = True
307
+ elif functions_section and line:
308
+ cleaned_output.append(line)
309
+ elif line.startswith("File:") or "Qwen," in line:
310
+ break
311
+
312
+ return "\n".join(cleaned_output)
313
 
314
 
315
  def split_into_chunks(content, chunk_size=1000):
 
323
 
324
  def clean_output(output):
325
  """
326
+ Cleans the output from Qwen to ensure only required sections are displayed.
327
  """
 
328
  lines = output.splitlines()
329
+ filtered_lines = []
330
+ in_valid_section = False
 
 
 
 
 
 
 
 
 
 
 
 
 
 
331
 
 
 
 
 
 
 
 
 
 
332
  for line in lines:
333
  line = line.strip()
334
+ if line.startswith("Project Summary:") or line.startswith("Functionality Summary:") or line.startswith("Functionality Flow:"):
335
+ in_valid_section = True
336
+ filtered_lines.append(line)
337
+ elif line.startswith("Function Documentation:"):
338
+ in_valid_section = True
339
+ filtered_lines.append(line)
340
+ elif in_valid_section and line:
341
+ filtered_lines.append(line)
342
+ elif line.startswith("File:") or line.startswith("User-specified functionality:"):
343
+ in_valid_section = False
344
 
345
+ return "\n".join(filtered_lines)
 
 
 
346
 
 
 
 
347
 
 
 
348
 
 
 
 
 
 
 
 
349
 
350
+ def validate_and_generate_documentation(api_url, headers, gemini_output, functionality_description):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
351
  """
352
+ Uses the Hugging Face Inference API to generate clean and relevant documentation using Qwen.
353
  """
354
+ # Clean Gemini output
355
+ cleaned_gemini_output = extract_cleaned_gemini_output(gemini_output)
356
+
357
+ # Generate the refined prompt for Qwen
358
+ prompt = f"""
359
  User-specified functionality: '{functionality_description}'
360
  Functions identified by Gemini:
361
+ {cleaned_gemini_output}
362
+
363
+ Tasks:
364
+ 1. Generate a project summary:
365
  '
366
  Project Summary:
367
+ <Include project description and library or module dependencies>
368
  '
369
+ 2. Refine the user-defined functionality:
 
370
  '
371
  Functionality Summary:
372
+ <Provide an enhanced description of user-specified functionality>
373
  '
374
+ 3. Describe the functionality flow:
 
375
  '
376
  Functionality Flow:
377
+ <Explain the sequence of functions and data flow>
378
  '
379
+ 4. Generate detailed documentation for each function:
 
380
  '
381
  Function Documentation:
382
  For each relevant function:
 
385
  - Outputs: <Details of outputs and their types>
386
  - Dependencies: <Dependencies on other modules/functions>
387
  - Data structures: <Details of data structures used>
388
+ - Algorithmic Details: <Description of the algorithm used>
389
  - Error Handling: <Description of how the function handles errors>
390
  - Assumptions: <Any assumptions the function makes>
391
+ - Example Usage: <Example demonstrating usage>
392
  '
393
+ 5. Return only the required information for the above tasks, and exclude everything else.
394
  """
395
 
396
+ # Prepare payload and call API
397
+ payload = {"inputs": prompt, "parameters": {"max_new_tokens": 1024}}
398
+ response = requests.post(api_url, headers=headers, json=payload)
 
399
 
400
+ # Handle API response
401
+ if response.status_code == 200:
402
+ api_response = response.json()
403
+ output = api_response.get("generated_text", "") if isinstance(api_response, dict) else api_response[0].get("generated_text", "")
404
+ return clean_output(output)
405
+ else:
406
+ raise ValueError(f"Error during API call: {response.status_code}, {response.text}")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
407
 
 
408
 
409
 
410
  def generate_documentation_page():
 
431
  # Call Gemini to identify required functions
432
  gemini_result = identify_required_functions(project_folder, functionality)
433
 
434
+ # Generate documentation using Qwen
 
 
 
 
435
  final_documentation = validate_and_generate_documentation(
436
+ API_URL, headers, gemini_result, functionality
437
  )
438
 
439
  # Display the final documentation
440
  st.success("Documentation generated successfully!")
441
  st.text_area("Generated Documentation", final_documentation, height=600)
442
+ st.rerun()
443
  except Exception as e:
444
  st.error(f"An error occurred: {e}")
445
  else:
446
  st.error("Project folder not found. Ensure the GitHub repository was cloned successfully.")
447
  else:
448
  st.error("Please enter the functionality to analyze.")
449
+
 
 
 
 
450
 
451
 
452