2025-08-05 17:49:23 +08:00
|
|
|
|
"""
|
|
|
|
|
|
仓库管理工具的工具函数
|
|
|
|
|
|
"""
|
|
|
|
|
|
|
|
|
|
|
|
import asyncio
|
|
|
|
|
|
from pathlib import Path
|
|
|
|
|
|
import re
|
|
|
|
|
|
|
|
|
|
|
|
from zhenxun.services.log import logger
|
|
|
|
|
|
|
|
|
|
|
|
from .config import LOG_COMMAND
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
async def check_git() -> bool:
    """
    Check whether a ``git`` command is reachable from the environment.

    Runs ``git --version`` through the shell and treats any bytes written to
    standard output as proof that git is available.

    Returns:
        bool: True if ``git --version`` produced output on stdout; False if
        stdout was empty or if running the subprocess raised an exception
        (the exception is logged).
    """
    try:
        pipe = asyncio.subprocess.PIPE
        proc = await asyncio.create_subprocess_shell(
            "git --version", stdout=pipe, stderr=pipe
        )
        # Only stdout matters here; stderr is captured just to keep it quiet.
        version_output = (await proc.communicate())[0]
    except Exception as e:
        logger.error("检查git命令失败", LOG_COMMAND, e=e)
        return False
    return bool(version_output)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
async def clean_git(cwd: Path) -> None:
    """
    Discard local changes in a git repository.

    Runs ``git reset --hard`` followed by ``git clean -xdf`` in ``cwd``.
    Both steps are always attempted. A step that fails is logged rather than
    silently ignored, and no exception is raised.

    Args:
        cwd: Working directory in which the git commands are executed.
    """
    for command in ("reset --hard", "clean -xdf"):
        success, out, err = await run_git_command(command, cwd)
        if not success:
            # Best-effort cleanup: report the failure but keep going.
            logger.error(f"清理git仓库失败: git {command}, 错误: {err or out}")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
async def run_git_command(
|
|
|
|
|
|
command: str, cwd: Path | None = None
|
|
|
|
|
|
) -> tuple[bool, str, str]:
|
|
|
|
|
|
"""
|
|
|
|
|
|
运行git命令
|
|
|
|
|
|
|
|
|
|
|
|
参数:
|
|
|
|
|
|
command: 命令
|
|
|
|
|
|
cwd: 工作目录
|
|
|
|
|
|
|
|
|
|
|
|
返回:
|
|
|
|
|
|
tuple[bool, str, str]: (是否成功, 标准输出, 标准错误)
|
|
|
|
|
|
"""
|
|
|
|
|
|
try:
|
|
|
|
|
|
full_command = f"git {command}"
|
|
|
|
|
|
# 将Path对象转换为字符串
|
|
|
|
|
|
cwd_str = str(cwd) if cwd else None
|
|
|
|
|
|
process = await asyncio.create_subprocess_shell(
|
|
|
|
|
|
full_command,
|
|
|
|
|
|
stdout=asyncio.subprocess.PIPE,
|
|
|
|
|
|
stderr=asyncio.subprocess.PIPE,
|
|
|
|
|
|
cwd=cwd_str,
|
|
|
|
|
|
)
|
|
|
|
|
|
stdout_bytes, stderr_bytes = await process.communicate()
|
|
|
|
|
|
|
|
|
|
|
|
stdout = stdout_bytes.decode("utf-8").strip()
|
|
|
|
|
|
stderr = stderr_bytes.decode("utf-8").strip()
|
|
|
|
|
|
|
|
|
|
|
|
return process.returncode == 0, stdout, stderr
|
|
|
|
|
|
except Exception as e:
|
|
|
|
|
|
logger.error(f"运行git命令失败: {command}, 错误: {e}")
|
|
|
|
|
|
return False, "", str(e)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def glob_to_regex(pattern: str) -> str:
    """
    Translate a glob pattern into an anchored regular expression string.

    Supported wildcards:
        ``**`` matches any sequence of characters, including ``/``.
        ``*``  matches any sequence of characters except ``/``.
        ``?``  matches exactly one character other than ``/``.

    Every other character is matched literally.

    Args:
        pattern: Glob pattern, e.g. ``"*.py"``.

    Returns:
        str: Regular expression source wrapped in ``^`` and ``$``.
    """
    # Escape everything first so that only the wildcards rewritten below
    # keep a special meaning in the final expression.
    translated = re.escape(pattern)

    # Order matters: the escaped "**" has to be rewritten before the
    # single "*" rule gets a chance to consume it.
    substitutions = (
        (r"\*\*", ".*"),
        (r"\*", "[^/]*"),
        (r"\?", "[^/]"),
    )
    for escaped_wildcard, replacement in substitutions:
        translated = translated.replace(escaped_wildcard, replacement)

    # Anchor both ends so the whole string has to match.
    return "^" + translated + "$"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def filter_files(
|
|
|
|
|
|
files: list[str],
|
|
|
|
|
|
include_patterns: list[str] | None = None,
|
|
|
|
|
|
exclude_patterns: list[str] | None = None,
|
|
|
|
|
|
) -> list[str]:
|
|
|
|
|
|
"""
|
|
|
|
|
|
过滤文件列表
|
|
|
|
|
|
|
|
|
|
|
|
参数:
|
|
|
|
|
|
files: 文件列表
|
|
|
|
|
|
include_patterns: 包含的文件模式列表,如 ["*.py", "docs/*.md"]
|
|
|
|
|
|
exclude_patterns: 排除的文件模式列表,如 ["__pycache__/*", "*.pyc"]
|
|
|
|
|
|
|
|
|
|
|
|
返回:
|
|
|
|
|
|
list[str]: 过滤后的文件列表
|
|
|
|
|
|
"""
|
|
|
|
|
|
result = files.copy()
|
|
|
|
|
|
|
|
|
|
|
|
# 应用包含模式
|
|
|
|
|
|
if include_patterns:
|
|
|
|
|
|
included = []
|
|
|
|
|
|
for pattern in include_patterns:
|
|
|
|
|
|
regex_pattern = glob_to_regex(pattern)
|
|
|
|
|
|
included.extend(file for file in result if re.match(regex_pattern, file))
|
|
|
|
|
|
result = included
|
|
|
|
|
|
|
|
|
|
|
|
# 应用排除模式
|
|
|
|
|
|
if exclude_patterns:
|
|
|
|
|
|
for pattern in exclude_patterns:
|
|
|
|
|
|
regex_pattern = glob_to_regex(pattern)
|
|
|
|
|
|
result = [file for file in result if not re.match(regex_pattern, file)]
|
|
|
|
|
|
|
|
|
|
|
|
return result
|
2025-08-26 18:01:32 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
async def _run_git_checked(command: str, cwd: Path, failure: str) -> None:
    """Run a git command in ``cwd`` and raise RuntimeError if it fails."""
    success, out, err = await run_git_command(command, cwd)
    if not success:
        raise RuntimeError(f"{failure}: {err or out}")


async def sparse_checkout_clone(
    repo_url: str,
    branch: str,
    sparse_path: str,
    target_dir: Path,
) -> None:
    """
    Clone one path of a repository into ``target_dir`` via git sparse checkout.

    The checkout is completely independent of the main project's git
    repository.

    Key guarantees:
    - ``.git`` is detected/initialized inside ``target_dir`` and every git
      operation runs with ``cwd=target_dir``.
    - The fetch and the working tree are forced: ``fetch --force``,
      ``checkout -B``, ``reset --hard``, ``clean -xdf``.
    - The sparse-checkout path is set on every call so that a changed path
      takes effect.

    NOTE(review): ``repo_url``, ``branch`` and ``sparse_path`` are
    interpolated unquoted into shell command lines by ``run_git_command``.
    Values containing spaces or shell metacharacters will not work as
    intended, so callers must only pass trusted values.

    Args:
        repo_url: URL of the remote repository, configured as ``origin``.
        branch: Name of the branch to fetch and check out.
        sparse_path: Path inside the repository to check out; must not be
            empty or whitespace-only.
        target_dir: Directory that receives the checkout; created if missing.

    Raises:
        RuntimeError: If ``sparse_path`` is empty, git is not available, or
            one of the required git steps (init, remote add,
            sparse-checkout set, fetch, checkout) fails.
    """
    # Validate the input before touching the filesystem or running git, so
    # an invalid call leaves no half-initialized repository behind.
    if not sparse_path or not sparse_path.strip():
        raise RuntimeError("sparse-checkout 路径不能为空")

    target_dir.mkdir(parents=True, exist_ok=True)

    if not await check_git():
        raise RuntimeError("未检测到可用的 git 命令")

    if not (target_dir / ".git").exists():
        await _run_git_checked("init", target_dir, "git init 失败")
        await _run_git_checked(
            f"remote add origin {repo_url}", target_dir, "添加远程失败"
        )
    else:
        success, out, err = await run_git_command(
            f"remote set-url origin {repo_url}", target_dir
        )
        if not success:
            # Fallback: try to add the remote instead.
            added, add_out, add_err = await run_git_command(
                f"remote add origin {repo_url}", target_dir
            )
            if not added:
                # Still best-effort: the fetch below raises if the remote is
                # really unusable, but the root cause is now in the log.
                logger.error(
                    f"设置远程地址失败: {err or out}; "
                    f"添加远程失败: {add_err or add_out}"
                )

    # Enable sparse checkout (repeated on every call to stay idempotent).
    # These two are best-effort; the "sparse-checkout set" below is checked.
    await run_git_command("config core.sparseCheckout true", target_dir)
    await run_git_command("sparse-checkout init --cone", target_dir)

    # Set the path to check out (overwrites the configuration every time).
    await _run_git_checked(
        f"sparse-checkout set {sparse_path}", target_dir, "配置稀疏路径失败"
    )

    # Force-fetch so the local state is synchronized with the remote.
    await _run_git_checked(
        f"fetch --force --depth 1 origin {branch}", target_dir, "fetch 失败"
    )

    # Force the local branch to the remote one and overwrite the work tree.
    success, out, err = await run_git_command(
        f"checkout -B {branch} origin/{branch}", target_dir
    )
    if not success:
        # Fallback: plain checkout of the branch.
        success2, out2, err2 = await run_git_command(f"checkout {branch}", target_dir)
        if not success2:
            raise RuntimeError(f"checkout 失败: {(err or out) or (err2 or out2)}")

    # Force the working tree to match the remote. Failures are logged rather
    # than raised, so the previous best-effort behavior is kept.
    for command in (f"reset --hard origin/{branch}", "clean -xdf"):
        success, out, err = await run_git_command(command, target_dir)
        if not success:
            logger.error(f"强制对齐工作区失败: git {command}, 错误: {err or out}")
|