mrhblfx commited on
Commit
9b5f088
1 Parent(s): 3a561a7

Changed matching rules

Browse files
crazy_functions/解析项目源代码.py CHANGED
@@ -268,19 +268,22 @@ def 解析一个CSharp项目(txt, llm_kwargs, plugin_kwargs, chatbot, history, s
268
 
269
  @CatchException
270
  def 解析任意code项目(txt, llm_kwargs, plugin_kwargs, chatbot, history, system_prompt, web_port):
271
- txt_include = plugin_kwargs.get("txt_include")
272
- txt_except = plugin_kwargs.get("txt_except")
273
- # 将要匹配的后缀
274
- pattern_include = [_.lstrip(" .,,").rstrip(" ,,") for _ in txt_include.split(" ") if _ != ""]
275
- pattern_include = [_.lstrip(" .,,").rstrip(" ,,") for __ in pattern_include for _ in __.split(",") if _ != ""]
276
- pattern_include = [_.lstrip(" .,,").rstrip(" ,,") for __ in pattern_include for _ in __.split(",") if _ != ""]
277
- # 将要忽略匹配的后缀
278
- pattern_except = [_.lstrip(" .,,").rstrip(" ,,") for _ in txt_except.split(" ") if _ != ""]
279
- pattern_except = [_.lstrip(" .,,").rstrip(" ,,") for __ in pattern_except for _ in __.split(",") if _ != ""]
280
- pattern_except = [_.lstrip(" .,,").rstrip(" ,,") for __ in pattern_except for _ in __.split("") if _ != ""]
281
- pattern_except += ['zip', 'rar', '7z', 'tar', 'gz'] # 避免解析上传的压缩文件
282
- history = [] # 清空历史,以免输入溢出
283
- import glob, os
 
 
 
284
  if os.path.exists(txt):
285
  project_folder = txt
286
  else:
@@ -288,8 +291,13 @@ def 解析任意code项目(txt, llm_kwargs, plugin_kwargs, chatbot, history, sys
288
  report_execption(chatbot, history, a = f"解析项目: {txt}", b = f"找不到本地项目或无权访问: {txt}")
289
  yield from update_ui(chatbot=chatbot, history=history) # 刷新界面
290
  return
291
- file_manifest = [f for f in glob.glob(f'{project_folder}/**/*.*', recursive=True) if os.path.isfile(f) and \
292
- ([] == pattern_include or f.split(".")[-1] in pattern_include) and f.split(".")[-1] not in pattern_except]
 
 
 
 
 
293
  if len(file_manifest) == 0:
294
  report_execption(chatbot, history, a = f"解析项目: {txt}", b = f"找不到任何文件: {txt}")
295
  yield from update_ui(chatbot=chatbot, history=history) # 刷新界面
 
268
 
269
  @CatchException
270
  def 解析任意code项目(txt, llm_kwargs, plugin_kwargs, chatbot, history, system_prompt, web_port):
271
+ txt_pattern = plugin_kwargs.get("txt_pattern")
272
+ txt_pattern = txt_pattern.replace("", ",")
273
+ # 将要匹配的模式(例如: *.c, *.cpp, *.py, config.toml)
274
+ pattern_include = [_.lstrip(" ,").rstrip(" ,") for _ in txt_pattern.split(",") if _ != "" and not _.strip().startswith("^")]
275
+ if not pattern_include: pattern_include = ["*"] # 不输入即全部匹配
276
+ # 将要忽略匹配的文件后缀(例如: ^*.c, ^*.cpp, ^*.py)
277
+ pattern_except_suffix = [_.lstrip(" ^*.,").rstrip(" ,") for _ in txt_pattern.split(" ") if _ != "" and _.strip().startswith("^*.")]
278
+ pattern_except_suffix += ['zip', 'rar', '7z', 'tar', 'gz'] # 避免解析压缩文件
279
+ # 将要忽略匹配的文件名(例如: ^README.md)
280
+ pattern_except_name = [_.lstrip(" ^*,").rstrip(" ,").replace(".", "\.") for _ in txt_pattern.split(" ") if _ != "" and _.strip().startswith("^") and not _.strip().startswith("^*.")]
281
+ # 生成正则表达式
282
+ pattern_except = '/[^/]+\.(' + "|".join(pattern_except_suffix) + ')$'
283
+ pattern_except += '|/(' + "|".join(pattern_except_name) + ')$' if pattern_except_name != [] else ''
284
+
285
+ history.clear()
286
+ import glob, os, re
287
  if os.path.exists(txt):
288
  project_folder = txt
289
  else:
 
291
  report_execption(chatbot, history, a = f"解析项目: {txt}", b = f"找不到本地项目或无权访问: {txt}")
292
  yield from update_ui(chatbot=chatbot, history=history) # 刷新界面
293
  return
294
+ # 若上传压缩文件, 先寻找到解压的文件夹路径, 从而避免解析压缩文件
295
+ maybe_dir = [f for f in glob.glob(f'{project_folder}/**') if os.path.isdir(f)]
296
+ extract_folder_path = maybe_dir[0].replace('\\', '/') if len(maybe_dir) != 0 else ""
297
+ # 按输入的匹配模式寻找上传的非压缩文件和已解压的文件
298
+ file_manifest = [f for f in glob.glob(f'{project_folder}/**') if os.path.isfile(f) and not re.search(pattern_except, f)] + \
299
+ [f for _ in pattern_include for f in glob.glob(f'{extract_folder_path}/**/{_}', recursive=True) if \
300
+ "" != extract_folder_path and os.path.isfile(f) and not re.search(pattern_except, f)]
301
  if len(file_manifest) == 0:
302
  report_execption(chatbot, history, a = f"解析项目: {txt}", b = f"找不到任何文件: {txt}")
303
  yield from update_ui(chatbot=chatbot, history=history) # 刷新界面