""" 仓库管理工具的工具函数 """ import asyncio from pathlib import Path import re from zhenxun.services.log import logger from .config import LOG_COMMAND async def check_git() -> bool: """ 检查环境变量中是否存在 git 返回: bool: 是否存在git命令 """ try: process = await asyncio.create_subprocess_shell( "git --version", stdout=asyncio.subprocess.PIPE, stderr=asyncio.subprocess.PIPE, ) stdout, _ = await process.communicate() return bool(stdout) except Exception as e: logger.error("检查git命令失败", LOG_COMMAND, e=e) return False async def clean_git(cwd: Path): """ 清理git仓库 参数: cwd: 工作目录 """ await run_git_command("reset --hard", cwd) await run_git_command("clean -xdf", cwd) async def run_git_command( command: str, cwd: Path | None = None ) -> tuple[bool, str, str]: """ 运行git命令 参数: command: 命令 cwd: 工作目录 返回: tuple[bool, str, str]: (是否成功, 标准输出, 标准错误) """ try: full_command = f"git {command}" # 将Path对象转换为字符串 cwd_str = str(cwd) if cwd else None process = await asyncio.create_subprocess_shell( full_command, stdout=asyncio.subprocess.PIPE, stderr=asyncio.subprocess.PIPE, cwd=cwd_str, ) stdout_bytes, stderr_bytes = await process.communicate() stdout = stdout_bytes.decode("utf-8").strip() stderr = stderr_bytes.decode("utf-8").strip() return process.returncode == 0, stdout, stderr except Exception as e: logger.error(f"运行git命令失败: {command}, 错误: {e}") return False, "", str(e) def glob_to_regex(pattern: str) -> str: """ 将glob模式转换为正则表达式 参数: pattern: glob模式,如 "*.py" 返回: str: 正则表达式 """ # 转义特殊字符 regex = re.escape(pattern) # 替换glob通配符 regex = regex.replace(r"\*\*", ".*") # ** -> .* regex = regex.replace(r"\*", "[^/]*") # * -> [^/]* regex = regex.replace(r"\?", "[^/]") # ? -> [^/] # 添加开始和结束标记 regex = f"^{regex}$" return regex def filter_files( files: list[str], include_patterns: list[str] | None = None, exclude_patterns: list[str] | None = None, ) -> list[str]: """ 过滤文件列表 参数: files: 文件列表 include_patterns: 包含的文件模式列表,如 ["*.py", "docs/*.md"] exclude_patterns: 排除的文件模式列表,如 ["__pycache__/*", "*.pyc"] 返回: list[str]: 过滤后的文件列表 """ result = files.copy() # 应用包含模式 if include_patterns: included = [] for pattern in include_patterns: regex_pattern = glob_to_regex(pattern) included.extend(file for file in result if re.match(regex_pattern, file)) result = included # 应用排除模式 if exclude_patterns: for pattern in exclude_patterns: regex_pattern = glob_to_regex(pattern) result = [file for file in result if not re.match(regex_pattern, file)] return result async def sparse_checkout_clone( repo_url: str, branch: str, sparse_path: str, target_dir: Path, ) -> None: """ 使用 git 稀疏检出克隆指定路径到目标目录(完全独立于主项目 git)。 关键保障: - 在 target_dir 下检测/初始化 .git,所有 git 操作均以 cwd=target_dir 执行 - 强制拉取与工作区覆盖: fetch --force、checkout -B、reset --hard、clean -xdf - 反复设置 sparse-checkout 路径,确保路径更新生效 """ target_dir.mkdir(parents=True, exist_ok=True) if not await check_git(): raise RuntimeError("未检测到可用的 git 命令") git_dir = target_dir / ".git" if not git_dir.exists(): success, out, err = await run_git_command("init", target_dir) if not success: raise RuntimeError(f"git init 失败: {err or out}") success, out, err = await run_git_command( f"remote add origin {repo_url}", target_dir ) if not success: raise RuntimeError(f"添加远程失败: {err or out}") else: success, out, err = await run_git_command( f"remote set-url origin {repo_url}", target_dir ) if not success: # 兜底尝试添加 await run_git_command(f"remote add origin {repo_url}", target_dir) # 启用稀疏检出(重复设置以确保幂等) await run_git_command("config core.sparseCheckout true", target_dir) await run_git_command("sparse-checkout init --cone", target_dir) # 设置需要检出的路径(每次都覆盖配置) if not sparse_path: raise RuntimeError("sparse-checkout 路径不能为空") success, out, err = await run_git_command( f"sparse-checkout set {sparse_path}", target_dir ) if not success: raise RuntimeError(f"配置稀疏路径失败: {err or out}") # 强制拉取并同步到远端 success, out, err = await run_git_command( f"fetch --force --depth 1 origin {branch}", target_dir ) if not success: raise RuntimeError(f"fetch 失败: {err or out}") # 使用远端强制更新本地分支并覆盖工作区 success, out, err = await run_git_command( f"checkout -B {branch} origin/{branch}", target_dir ) if not success: # 回退方案 success2, out2, err2 = await run_git_command(f"checkout {branch}", target_dir) if not success2: raise RuntimeError(f"checkout 失败: {(err or out) or (err2 or out2)}") # 强制对齐工作区 await run_git_command(f"reset --hard origin/{branch}", target_dir) await run_git_command("clean -xdf", target_dir)