mirror of
https://github.com/zhenxun-org/zhenxun_bot.git
synced 2025-12-15 14:22:55 +08:00
208 lines
6.0 KiB
Python
208 lines
6.0 KiB
Python
"""
|
||
仓库管理工具的工具函数
|
||
"""
|
||
|
||
import asyncio
|
||
from pathlib import Path
|
||
import re
|
||
|
||
from zhenxun.services.log import logger
|
||
|
||
from .config import LOG_COMMAND
|
||
|
||
|
||
async def check_git() -> bool:
|
||
"""
|
||
检查环境变量中是否存在 git
|
||
|
||
返回:
|
||
bool: 是否存在git命令
|
||
"""
|
||
try:
|
||
process = await asyncio.create_subprocess_shell(
|
||
"git --version",
|
||
stdout=asyncio.subprocess.PIPE,
|
||
stderr=asyncio.subprocess.PIPE,
|
||
)
|
||
stdout, _ = await process.communicate()
|
||
return bool(stdout)
|
||
except Exception as e:
|
||
logger.error("检查git命令失败", LOG_COMMAND, e=e)
|
||
return False
|
||
|
||
|
||
async def clean_git(cwd: Path):
|
||
"""
|
||
清理git仓库
|
||
|
||
参数:
|
||
cwd: 工作目录
|
||
"""
|
||
await run_git_command("reset --hard", cwd)
|
||
await run_git_command("clean -xdf", cwd)
|
||
|
||
|
||
async def run_git_command(
|
||
command: str, cwd: Path | None = None
|
||
) -> tuple[bool, str, str]:
|
||
"""
|
||
运行git命令
|
||
|
||
参数:
|
||
command: 命令
|
||
cwd: 工作目录
|
||
|
||
返回:
|
||
tuple[bool, str, str]: (是否成功, 标准输出, 标准错误)
|
||
"""
|
||
try:
|
||
full_command = f"git {command}"
|
||
# 将Path对象转换为字符串
|
||
cwd_str = str(cwd) if cwd else None
|
||
process = await asyncio.create_subprocess_shell(
|
||
full_command,
|
||
stdout=asyncio.subprocess.PIPE,
|
||
stderr=asyncio.subprocess.PIPE,
|
||
cwd=cwd_str,
|
||
)
|
||
stdout_bytes, stderr_bytes = await process.communicate()
|
||
|
||
stdout = stdout_bytes.decode("utf-8").strip()
|
||
stderr = stderr_bytes.decode("utf-8").strip()
|
||
|
||
return process.returncode == 0, stdout, stderr
|
||
except Exception as e:
|
||
logger.error(f"运行git命令失败: {command}, 错误: {e}")
|
||
return False, "", str(e)
|
||
|
||
|
||
def glob_to_regex(pattern: str) -> str:
|
||
"""
|
||
将glob模式转换为正则表达式
|
||
|
||
参数:
|
||
pattern: glob模式,如 "*.py"
|
||
|
||
返回:
|
||
str: 正则表达式
|
||
"""
|
||
# 转义特殊字符
|
||
regex = re.escape(pattern)
|
||
|
||
# 替换glob通配符
|
||
regex = regex.replace(r"\*\*", ".*") # ** -> .*
|
||
regex = regex.replace(r"\*", "[^/]*") # * -> [^/]*
|
||
regex = regex.replace(r"\?", "[^/]") # ? -> [^/]
|
||
|
||
# 添加开始和结束标记
|
||
regex = f"^{regex}$"
|
||
|
||
return regex
|
||
|
||
|
||
def filter_files(
|
||
files: list[str],
|
||
include_patterns: list[str] | None = None,
|
||
exclude_patterns: list[str] | None = None,
|
||
) -> list[str]:
|
||
"""
|
||
过滤文件列表
|
||
|
||
参数:
|
||
files: 文件列表
|
||
include_patterns: 包含的文件模式列表,如 ["*.py", "docs/*.md"]
|
||
exclude_patterns: 排除的文件模式列表,如 ["__pycache__/*", "*.pyc"]
|
||
|
||
返回:
|
||
list[str]: 过滤后的文件列表
|
||
"""
|
||
result = files.copy()
|
||
|
||
# 应用包含模式
|
||
if include_patterns:
|
||
included = []
|
||
for pattern in include_patterns:
|
||
regex_pattern = glob_to_regex(pattern)
|
||
included.extend(file for file in result if re.match(regex_pattern, file))
|
||
result = included
|
||
|
||
# 应用排除模式
|
||
if exclude_patterns:
|
||
for pattern in exclude_patterns:
|
||
regex_pattern = glob_to_regex(pattern)
|
||
result = [file for file in result if not re.match(regex_pattern, file)]
|
||
|
||
return result
|
||
|
||
|
||
async def sparse_checkout_clone(
|
||
repo_url: str,
|
||
branch: str,
|
||
sparse_path: str,
|
||
target_dir: Path,
|
||
) -> None:
|
||
"""
|
||
使用 git 稀疏检出克隆指定路径到目标目录(完全独立于主项目 git)。
|
||
|
||
关键保障:
|
||
- 在 target_dir 下检测/初始化 .git,所有 git 操作均以 cwd=target_dir 执行
|
||
- 强制拉取与工作区覆盖: fetch --force、checkout -B、reset --hard、clean -xdf
|
||
- 反复设置 sparse-checkout 路径,确保路径更新生效
|
||
"""
|
||
target_dir.mkdir(parents=True, exist_ok=True)
|
||
|
||
if not await check_git():
|
||
raise RuntimeError("未检测到可用的 git 命令")
|
||
|
||
git_dir = target_dir / ".git"
|
||
if not git_dir.exists():
|
||
success, out, err = await run_git_command("init", target_dir)
|
||
if not success:
|
||
raise RuntimeError(f"git init 失败: {err or out}")
|
||
success, out, err = await run_git_command(
|
||
f"remote add origin {repo_url}", target_dir
|
||
)
|
||
if not success:
|
||
raise RuntimeError(f"添加远程失败: {err or out}")
|
||
else:
|
||
success, out, err = await run_git_command(
|
||
f"remote set-url origin {repo_url}", target_dir
|
||
)
|
||
if not success:
|
||
# 兜底尝试添加
|
||
await run_git_command(f"remote add origin {repo_url}", target_dir)
|
||
|
||
# 启用稀疏检出(重复设置以确保幂等)
|
||
await run_git_command("config core.sparseCheckout true", target_dir)
|
||
await run_git_command("sparse-checkout init --cone", target_dir)
|
||
|
||
# 设置需要检出的路径(每次都覆盖配置)
|
||
if not sparse_path:
|
||
raise RuntimeError("sparse-checkout 路径不能为空")
|
||
success, out, err = await run_git_command(
|
||
f"sparse-checkout set {sparse_path}", target_dir
|
||
)
|
||
if not success:
|
||
raise RuntimeError(f"配置稀疏路径失败: {err or out}")
|
||
|
||
# 强制拉取并同步到远端
|
||
success, out, err = await run_git_command(
|
||
f"fetch --force --depth 1 origin {branch}", target_dir
|
||
)
|
||
if not success:
|
||
raise RuntimeError(f"fetch 失败: {err or out}")
|
||
|
||
# 使用远端强制更新本地分支并覆盖工作区
|
||
success, out, err = await run_git_command(
|
||
f"checkout -B {branch} origin/{branch}", target_dir
|
||
)
|
||
if not success:
|
||
# 回退方案
|
||
success2, out2, err2 = await run_git_command(f"checkout {branch}", target_dir)
|
||
if not success2:
|
||
raise RuntimeError(f"checkout 失败: {(err or out) or (err2 or out2)}")
|
||
|
||
# 强制对齐工作区
|
||
await run_git_command(f"reset --hard origin/{branch}", target_dir)
|
||
await run_git_command("clean -xdf", target_dir)
|