* typo: Fix typos and rename functions across multiple files This commit addresses several minor issues: - Corrected spelling of function names (e.g., `update_ui_lastest_msg` to `update_ui_latest_msg`) - Fixed typos in comments and variable names - Corrected capitalization in some strings (e.g., "ArXiv" instead of "Arixv") - Renamed some variables for consistency - Corrected some console-related parameter names (e.g., `console_slience` to `console_silence`) The changes span multiple files across the project, including request LLM bridges, crazy functions, and utility modules. * fix: f-string expression part cannot include a backslash (#2139) * raise error when the uploaded tar contain hard/soft link (#2136) * minor bug fix * fine tune reasoning css * upgrade internet gpt plugin * Update README.md * fix GHSA-gqp5-wm97-qxcv * typo fix * update readme --------- Co-authored-by: binary-husky <96192199+binary-husky@users.noreply.github.com> Co-authored-by: binary-husky <qingxu.fu@outlook.com>
163 lines
8.2 KiB
Python
163 lines
8.2 KiB
Python
import os, copy, time
|
||
from toolbox import CatchException, report_exception, update_ui, zip_result, promote_file_to_downloadzone, update_ui_latest_msg, get_conf, generate_file_link
|
||
from shared_utils.fastapi_server import validate_path_safety
|
||
from crazy_functions.crazy_utils import input_clipping
|
||
from crazy_functions.crazy_utils import request_gpt_model_multi_threads_with_very_awesome_ui_and_high_efficiency
|
||
from crazy_functions.crazy_utils import request_gpt_model_in_new_thread_with_ui_alive
|
||
from crazy_functions.agent_fns.python_comment_agent import PythonCodeComment
|
||
from crazy_functions.diagram_fns.file_tree import FileNode
|
||
from crazy_functions.agent_fns.watchdog import WatchDog
|
||
from shared_utils.advanced_markdown_format import markdown_convertion_for_file
|
||
from loguru import logger
|
||
|
||
|
||
def 注释源代码(file_manifest, project_folder, llm_kwargs, plugin_kwargs, chatbot, history, system_prompt):
|
||
|
||
summary_batch_isolation = True
|
||
inputs_array = []
|
||
inputs_show_user_array = []
|
||
history_array = []
|
||
sys_prompt_array = []
|
||
|
||
assert len(file_manifest) <= 512, "源文件太多(超过512个), 请缩减输入文件的数量。或者,您也可以选择删除此行警告,并修改代码拆分file_manifest列表,从而实现分批次处理。"
|
||
|
||
# 建立文件树
|
||
file_tree_struct = FileNode("root", build_manifest=True)
|
||
for file_path in file_manifest:
|
||
file_tree_struct.add_file(file_path, file_path)
|
||
|
||
# <第一步,逐个文件分析,多线程>
|
||
lang = "" if not plugin_kwargs["use_chinese"] else " (you must use Chinese)"
|
||
for index, fp in enumerate(file_manifest):
|
||
# 读取文件
|
||
with open(fp, 'r', encoding='utf-8', errors='replace') as f:
|
||
file_content = f.read()
|
||
prefix = ""
|
||
i_say = prefix + f'Please conclude the following source code at {os.path.relpath(fp, project_folder)} with only one sentence{lang}, the code is:\n```{file_content}```'
|
||
i_say_show_user = prefix + f'[{index+1}/{len(file_manifest)}] 请用一句话对下面的程序文件做一个整体概述: {fp}'
|
||
# 装载请求内容
|
||
MAX_TOKEN_SINGLE_FILE = 2560
|
||
i_say, _ = input_clipping(inputs=i_say, history=[], max_token_limit=MAX_TOKEN_SINGLE_FILE)
|
||
inputs_array.append(i_say)
|
||
inputs_show_user_array.append(i_say_show_user)
|
||
history_array.append([])
|
||
sys_prompt_array.append(f"You are a software architecture analyst analyzing a source code project. Do not dig into details, tell me what the code is doing in general. Your answer must be short, simple and clear{lang}.")
|
||
# 文件读取完成,对每一个源代码文件,生成一个请求线程,发送到大模型进行分析
|
||
gpt_response_collection = yield from request_gpt_model_multi_threads_with_very_awesome_ui_and_high_efficiency(
|
||
inputs_array = inputs_array,
|
||
inputs_show_user_array = inputs_show_user_array,
|
||
history_array = history_array,
|
||
sys_prompt_array = sys_prompt_array,
|
||
llm_kwargs = llm_kwargs,
|
||
chatbot = chatbot,
|
||
show_user_at_complete = True
|
||
)
|
||
|
||
# <第二步,逐个文件分析,生成带注释文件>
|
||
tasks = ["" for _ in range(len(file_manifest))]
|
||
def bark_fn(tasks):
|
||
for i in range(len(tasks)): tasks[i] = "watchdog is dead"
|
||
wd = WatchDog(timeout=10, bark_fn=lambda: bark_fn(tasks), interval=3, msg="ThreadWatcher timeout")
|
||
wd.begin_watch()
|
||
from concurrent.futures import ThreadPoolExecutor
|
||
executor = ThreadPoolExecutor(max_workers=get_conf('DEFAULT_WORKER_NUM'))
|
||
def _task_multi_threading(i_say, gpt_say, fp, file_tree_struct, index):
|
||
language = 'Chinese' if plugin_kwargs["use_chinese"] else 'English'
|
||
def observe_window_update(x):
|
||
if tasks[index] == "watchdog is dead":
|
||
raise TimeoutError("ThreadWatcher: watchdog is dead")
|
||
tasks[index] = x
|
||
pcc = PythonCodeComment(llm_kwargs, plugin_kwargs, language=language, observe_window_update=observe_window_update)
|
||
pcc.read_file(path=fp, brief=gpt_say)
|
||
revised_path, revised_content = pcc.begin_comment_source_code(None, None)
|
||
file_tree_struct.manifest[fp].revised_path = revised_path
|
||
file_tree_struct.manifest[fp].revised_content = revised_content
|
||
# <将结果写回源文件>
|
||
with open(fp, 'w', encoding='utf-8') as f:
|
||
f.write(file_tree_struct.manifest[fp].revised_content)
|
||
# <生成对比html>
|
||
with open("crazy_functions/agent_fns/python_comment_compare.html", 'r', encoding='utf-8') as f:
|
||
html_template = f.read()
|
||
warp = lambda x: "```python\n\n" + x + "\n\n```"
|
||
from themes.theme import load_dynamic_theme
|
||
_, advanced_css, _, _ = load_dynamic_theme("Default")
|
||
html_template = html_template.replace("ADVANCED_CSS", advanced_css)
|
||
html_template = html_template.replace("REPLACE_CODE_FILE_LEFT", pcc.get_markdown_block_in_html(markdown_convertion_for_file(warp(pcc.original_content))))
|
||
html_template = html_template.replace("REPLACE_CODE_FILE_RIGHT", pcc.get_markdown_block_in_html(markdown_convertion_for_file(warp(revised_content))))
|
||
compare_html_path = fp + '.compare.html'
|
||
file_tree_struct.manifest[fp].compare_html = compare_html_path
|
||
with open(compare_html_path, 'w', encoding='utf-8') as f:
|
||
f.write(html_template)
|
||
tasks[index] = ""
|
||
|
||
chatbot.append([None, f"正在处理:"])
|
||
futures = []
|
||
index = 0
|
||
for i_say, gpt_say, fp in zip(gpt_response_collection[0::2], gpt_response_collection[1::2], file_manifest):
|
||
future = executor.submit(_task_multi_threading, i_say, gpt_say, fp, file_tree_struct, index)
|
||
index += 1
|
||
futures.append(future)
|
||
|
||
# <第三步,等待任务完成>
|
||
cnt = 0
|
||
while True:
|
||
cnt += 1
|
||
wd.feed()
|
||
time.sleep(3)
|
||
worker_done = [h.done() for h in futures]
|
||
remain = len(worker_done) - sum(worker_done)
|
||
|
||
# <展示已经完成的部分>
|
||
preview_html_list = []
|
||
for done, fp in zip(worker_done, file_manifest):
|
||
if not done: continue
|
||
if hasattr(file_tree_struct.manifest[fp], 'compare_html'):
|
||
preview_html_list.append(file_tree_struct.manifest[fp].compare_html)
|
||
else:
|
||
logger.error(f"文件: {fp} 的注释结果未能成功")
|
||
file_links = generate_file_link(preview_html_list)
|
||
|
||
yield from update_ui_latest_msg(
|
||
f"当前任务: <br/>{'<br/>'.join(tasks)}.<br/>" +
|
||
f"剩余源文件数量: {remain}.<br/>" +
|
||
f"已完成的文件: {sum(worker_done)}.<br/>" +
|
||
file_links +
|
||
"<br/>" +
|
||
''.join(['.']*(cnt % 10 + 1)
|
||
), chatbot=chatbot, history=history, delay=0)
|
||
yield from update_ui(chatbot=chatbot, history=[]) # 刷新界面
|
||
if all(worker_done):
|
||
executor.shutdown()
|
||
break
|
||
|
||
# <第四步,压缩结果>
|
||
zip_res = zip_result(project_folder)
|
||
promote_file_to_downloadzone(file=zip_res, chatbot=chatbot)
|
||
|
||
# <END>
|
||
chatbot.append((None, "所有源文件均已处理完毕。"))
|
||
yield from update_ui(chatbot=chatbot, history=history) # 刷新界面
|
||
|
||
|
||
|
||
@CatchException
|
||
def 注释Python项目(txt, llm_kwargs, plugin_kwargs, chatbot, history, system_prompt, user_request):
|
||
history = [] # 清空历史,以免输入溢出
|
||
plugin_kwargs["use_chinese"] = plugin_kwargs.get("use_chinese", False)
|
||
import glob, os
|
||
if os.path.exists(txt):
|
||
project_folder = txt
|
||
validate_path_safety(project_folder, chatbot.get_user())
|
||
else:
|
||
if txt == "": txt = '空空如也的输入栏'
|
||
report_exception(chatbot, history, a = f"解析项目: {txt}", b = f"找不到本地项目或无权访问: {txt}")
|
||
yield from update_ui(chatbot=chatbot, history=history) # 刷新界面
|
||
return
|
||
file_manifest = [f for f in glob.glob(f'{project_folder}/**/*.py', recursive=True)]
|
||
if len(file_manifest) == 0:
|
||
report_exception(chatbot, history, a = f"解析项目: {txt}", b = f"找不到任何python文件: {txt}")
|
||
yield from update_ui(chatbot=chatbot, history=history) # 刷新界面
|
||
return
|
||
|
||
yield from 注释源代码(file_manifest, project_folder, llm_kwargs, plugin_kwargs, chatbot, history, system_prompt)
|