diff --git a/test/common/doc/EnvPreCheck.md b/test/common/doc/EnvPreCheck.md
new file mode 100644
index 000000000..ffca6b3b8
--- /dev/null
+++ b/test/common/doc/EnvPreCheck.md
@@ -0,0 +1,123 @@
+# 环境预检（Environment PreCheck）自动化测试套件
+
+基于 pytest 的环境预检自动化测试，用于在大规模训练或推理任务执行前，对集群环境的关键能力进行全面验证。该预检流程覆盖 SSH 连通性、设备健康状态、节点间通信、TLS 配置、模型权重完整性以及存储带宽等关键组件，确保集群处于可用且一致的运行状态。
+
+# 测试框架具备以下特性：
+
+1、针对 NPU（Ascend）/ GPU 自动识别执行相应测试
+
+2、所有测试项均动态输出，便于快速识别检测
+
+3、全面覆盖环境依赖的核心组件
+
+
+# 功能概述
+
+本测试套件在模型部署或训练前自动执行以下预检内容：
+
+✔ SSH 登录能力检查：确保 Master/Worker 的免密登录配置正确。
+
+✔ 设备状态检查（NPU / GPU）：检测各节点的设备是否在线、驱动是否正常。
+
+✔ 节点间 Ping 连通性检查：验证 HCCN（NPU）或 NVIDIA（GPU）网络链路是否可达、是否存在丢包或故障链路。
+
+✔ TLS 配置检查：检查 Ascend 集群中设备间 TLS 加密链路开关状态。
+
+✔ 模型权重完整性检查：包括权重文件列表扫描、哈希值校验和权重有效性验证
+
+✔ 存储点带宽检查：检查 embedding / fetch 操作带宽，并与配置文件中的限制进行比较。
+
+
+# 🚀 ###########如何运行测试（test/下执行）#############
+# 目录结构说明
+├── tests/
+├── common/
+│   └── envPreCheck/
+│       ├── run_env_preCheck.py # 所有检查逻辑
+│       └── ...
+├── suites
+│   └── E2E/
+│       ├── test_environment_precheck.py # 执行逻辑
+│       └── ...
+├── config.yaml                  # 预检的阈值配置
+
+# 运行完整的阶段预检
+pytest --stage=2
+
+# 按平台运行预检（公共检测项默认NPU平台）
+# NPU环境
+pytest --platform=npu
+# GPU环境
+pytest --platform=gpu
+
+# 按特性类别运行
+pytest --feature=test_ssh_login
+
+# 按文件运行
+pytest suites/E2E/test_environment_precheck.py
+
+
+# 🛠️ #########以下为各测试的示例说明##########
+# ● SSH 登录检查：
+test_ssh_login()
+校验 master/worker SSH 免密登录
+
+任何失败将立即中止后续测试
+
+# ● 设备状态检查（NPU/GPU）
+test_hccn_check_device_status()
+test_nvidia_check_device_status()
+
+检查设备是否在线、是否可用
+
+# ● HCCN / NVIDIA Ping 连通性检查
+test_check_hccn_ping()
+test_check_nvidia_ping()
+
+生成所有链路状态信息，例如：
+
+local_card_0 → local_card_1
+
+local_card_0 → remote_IP
+
+remote_card_1 → local_IP
+
+# ● TLS 开关检查
+test_check_tls()
+
+校验每张卡的tls switch是否为0
+
+# ● 模型权重完整性检查
+test_check_model_weights()
+
+权重文件列表扫描、哈希值校验和权重有效性验证
+
+# ● 存储带宽检测
+test_check_bandwidth()
+
+检查存储实际待遇是否达到预期带宽：实际 bandwidth < 阈值 * 0.85，否则判定为异常
+
+
+# ⚙️##########配置项说明（config.yaml）##########
+master_ip：集群主节点（Master）的 SSH 登录 IP，用于执行预检中的主节点检查。
+
+worker_ip：集群工作节点（Worker）的 IP 地址，用于检测 Worker 的设备状态、网络连通性等。
+
+ascend_rt_visible_devices：设置 Ascend/NPU 的可见设备序号，用于设备状态和带宽测试。
+
+node_num：集群节点数量，用于预检逻辑判断是否需要跨节点检查。
+
+model_path：模型权重所在目录，用于权重文件检查和哈希校验。
+
+hf_model_name：Hugging Face 模型名称，用于识别模型类型与路径结构。
+
+middle_page：模型对应的中间页面/组织名称，用于存储结构或路径判断
+
+expected_embed_bandwidth：预期 embedding 带宽（GB/s），用于对比实际带宽是否满足阈值。
+
+expected_fetch_bandwidth：预期 fetch 带宽（GB/s），与实际带宽比较判断读写性能是否正常。
+
+kvCache_block_number：KV Cache 预分配 block 数量，用于环境容量检查或推理配置校验。
+
+storage_backends：存储后端挂载路径，用于带宽测试和路径可用性检查。
+将这些内容复制打出来
\ No newline at end of file
diff --git a/test/common/doc/LLMPerf.md b/test/common/doc/LLMPerf.md
new file mode 100644
index 000000000..8210bb8e2
--- /dev/null
+++ b/test/common/doc/LLMPerf.md
@@ -0,0 +1,68 @@
+# 📝 LLM 性能测试使用说明
+
+## 🔧 功能概述  
+本测试用于评估 LLM 推理服务在不同负载下的性能表现，涵盖延迟、吞吐量、请求成功率等关键指标。
+
+## 📌 测试参数说明
+
+| 参数 | 说明 | 示例 |
+|------|------|------|
+| `mean_input_tokens` | 平均输入 token 数 | `[2000, 3000]` |
+| `mean_output_tokens` | 平均输出 token 数 | `[200, 500]` |
+| `max_num_completed_requests` | 最大完成请求数 | `[8, 4]` |
+| `concurrent_requests` | 并发请求数 | `[8, 4]` |
+| `additional_sampling_params` | 额外采样参数（如 temperature） | `["{}", "{}"]` |
+| `hit_rate` | 缓存命中率 | `[0, 50]` |
+
+> ✅ 支持多组参数组合运行，自动执行多轮推理并收集统计结果。
+
+## 📊 输出结果
+
+测试完成后，将输出以下性能指标的统计值（每轮结果均记录）：
+
+- **延迟指标**：  
+  - `inter_token_latency_s`（token 间延迟）  
+  - `ttft_s`（首个 token 延迟）  
+  - `end_to_end_latency_s`（端到端延迟）  
+  - 各项包含：P50、P90、P99、平均值
+
+- **吞吐量指标**：  
+  - `total_throughput`（总吞吐量）  
+  - `incremental_throughput`（增量吞吐量）
+
+- **其他指标**：  
+  - `num_completed_requests`（完成请求数）  
+  - `elapsed_time`（总耗时）  
+  - `incremental_time_delay`（增量时间延迟）
+
+## ✅ 验证规则
+
+- 所有数值必须 > 0
+- 若出现 `None` 或 ≤ 0 的值，测试将标记为失败，并输出异常详情
+
+## 📤 输出格式
+
+返回一个字典，包含：
+```python
+{
+    "_name": "llmperf",
+    "_data": {  # 所有指标的列表
+        "results_inter_token_latency_s_quantiles_p50": [...],
+        "results_ttft_s_mean": [...],
+        # ...
+    }
+}
+```
+
+## 🚀 使用方式 test/下运行
+
+# 按文件运行
+pytest test_uc_performance.py
+
+# 按阶段运行
+pytest --stage=0
+
+# 按特性运行
+pytest --feature=uc_performance_test
+
+> ⚠️ 确保已安装依赖：`pytest` 等模块。
\ No newline at end of file
diff --git a/test/common/envPreCheck/__init__.py b/test/common/envPreCheck/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/test/common/envPreCheck/run_env_preCheck.py b/test/common/envPreCheck/run_env_preCheck.py
new file mode 100644
index 000000000..f99b87952
--- /dev/null
+++ b/test/common/envPreCheck/run_env_preCheck.py
@@ -0,0 +1,1395 @@
+import os
+import re
+import secrets
+import shlex
+import subprocess
+import sys
+import threading
+import time
+from pathlib import Path
+from typing import Any, Dict, List, Optional, Tuple
+
+import ucmstore
+import yaml
+
+CODE_ROOT = Path(__file__).resolve().parent
+Custom_SSH_DIR = (CODE_ROOT / "ssh_keys").resolve()
+Custom_SSH_DIR.mkdir(parents=True, exist_ok=True)
+
+LOCAL_SSH_KEY = Custom_SSH_DIR / "id_rsa"
+LOCAL_SSH_KEY_PUB = Custom_SSH_DIR / "id_rsa.pub"
+
+config_file = Path(__file__).parent.parent.parent / "config.yaml"
+with open(config_file, "r", encoding="utf-8") as f:
+    config = yaml.safe_load(f)
+    MASTER_IP = config.get("Env_preCheck", {}).get("master_ip", "")
+    WORKER_IP = config.get("Env_preCheck", {}).get("worker_ip", "")
+    ASCEND_RT_VISIBLE_DEVICES = config.get("Env_preCheck", {}).get(
+        "ascend_rt_visible_devices", ""
+    )
+    NODE_NUM = config.get("Env_preCheck", {}).get("node_num", "")
+    MODEL_PATH = config.get("Env_preCheck", {}).get("model_path", "")
+    HF_MODEL_NAME = config.get("Env_preCheck", {}).get("hf_model_name", "")
+    MIDDLE_PAGE = config.get("Env_preCheck", {}).get("middle_page", "")
+
+    KVCACHE_BLOCK_NUMBER = config.get("Env_preCheck", {}).get(
+        "kvCache_block_number", ""
+    )
+    STORAGE_BACKENDS = config.get("Env_preCheck", {}).get("storage_backends", "")
+
+
+def run_command(
+    cmd: List[str], check: bool = True, timeout: Optional[int] = None
+) -> Tuple[int, str, str]:
+    """
+    Execute a command and return (return_code, stdout, stderr).
+
+    Args:
+        cmd: List of command arguments.
+        check: If True, raise an exception on non-zero return code.
+        timeout: Maximum time (in seconds) to wait for command completion.
+                 If None, no timeout is applied.
+
+    Returns:
+        A tuple containing:
+        - return_code: Exit code of the command.
+        - stdout: Captured standard output.
+        - stderr: Captured standard error.
+
+    Raises:
+        subprocess.TimeoutExpired: If the command times out.
+        Exception: For any other unexpected error.
+    """
+    try:
+        result = subprocess.run(cmd, capture_output=True, text=True, timeout=timeout)
+        return result.returncode, result.stdout, result.stderr
+    except subprocess.TimeoutExpired:
+        return -1, "", f"Command timed out after {timeout} seconds"
+    except Exception as e:
+        return -1, "", str(e)
+
+
+def print_info(msg: str):
+    """Print an info-level message."""
+    print(f"[INFO] {msg}")
+
+
+def print_error(msg: str):
+    """Print an error-level message to stderr."""
+    print(f"[ERROR] {msg}", file=sys.stderr)
+
+
+def import_env_from_file(config_path: Optional[Path] = None) -> List[str]:
+    """
+    Load environment variables from a properties file.
+
+    This function reads a configuration file (default: 'config.properties')
+    and exports each key-value pair as an environment variable.
+
+    Args:
+        config_path (Path, optional): Path to the config file.
+            If not provided, defaults to 'config.properties' in the script's directory.
+
+    Returns:
+        List[str]: List of environment variable names that were successfully loaded.
+
+    Raises:
+        SystemExit: If the config file does not exist.
+    """
+
+    # Determine config file path
+    config_file = config_path or CODE_ROOT / "config.properties"
+
+    # Check if config file exists
+    if not config_file.exists():
+        print(f"Configuration file not found: {config_file}", file=sys.stderr)
+        sys.exit(1)
+
+    print("\n========================================")
+    print("Loading environment variables from config file:")
+    print("========================================")
+    time.sleep(2)
+
+    loaded_vars = []
+
+    try:
+        with open(config_file, "r", encoding="utf-8") as f:
+            for line_num, line in enumerate(f, start=1):
+                line = line.strip()
+
+                # Skip empty lines and comments
+                if not line or line.startswith("#"):
+                    continue
+
+                # Ensure line has exactly one '='
+                if line.count("=") != 1:
+                    print(f"Invalid format on line {line_num}: {line}", file=sys.stderr)
+                    continue
+
+                key, value = line.split("=", 1)
+                key = key.strip()
+                value = value.strip()
+
+                # Skip if key is empty
+                if not key:
+                    print(f"Empty variable name on line {line_num}", file=sys.stderr)
+                    continue
+
+                # Set environment variable
+                os.environ[key] = value
+                loaded_vars.append(key)
+
+                # Print exported variable
+                print(f"export {key}={value}")
+
+    except PermissionError:
+        print(
+            f"Permission denied when reading config file: {config_file}",
+            file=sys.stderr,
+        )
+        sys.exit(1)
+    except Exception as e:
+        print(f"Unexpected error while reading config file: {e}", file=sys.stderr)
+        sys.exit(1)
+
+    print("========================================")
+    print(f"Successfully loaded {len(loaded_vars)} environment variables.")
+    print("========================================")
+    time.sleep(2)
+
+
+def check_ssh_login(ip: str) -> bool:
+    """
+    Test SSH passwordless login to a remote host.
+
+    Args:
+        ip: IP address of the remote host.
+
+    Returns:
+        True if SSH login succeeds without password prompt; False otherwise.
+    """
+    cmd = [
+        "ssh",
+        "-o",
+        "BatchMode=yes",
+        "-o",
+        "ConnectTimeout=5",
+        "-i",
+        str(LOCAL_SSH_KEY),
+        f"root@{ip}",
+        "exit",
+    ]
+    return run_command(cmd, check=False)[0] == 0
+
+
+def setup_ssh_key(ip: str) -> None:
+    """
+    Configure passwordless SSH login for a remote host.
+
+    Steps:
+        1. Ensure local SSH key pair exists (generate if missing).
+        2. Upload public key to the remote host using ssh-copy-id.
+        3. Verify that passwordless SSH login works.
+
+    Args:
+        ip: IP address of the target remote host.
+
+    Raises:
+        SystemExit: If any step fails (e.g., key generation, upload, or verification).
+    """
+    print(f"[UC] Configuring passwordless SSH login for {ip}...")
+
+    # Ensure local SSH key pair exists
+    if not LOCAL_SSH_KEY.exists():
+        print_info(f"Generating new SSH key pair: {LOCAL_SSH_KEY}")
+        ret, _, err = run_command(
+            [
+                "ssh-keygen",
+                "-t",
+                "rsa",
+                "-b",
+                "4096",
+                "-f",
+                str(LOCAL_SSH_KEY),
+                "-N",
+                "",  # No passphrase
+            ]
+        )
+        if ret != 0:
+            print_error(f"Failed to generate SSH key: {err}")
+            # sys.exit(1)
+            return False
+
+    # Upload public key to remote host
+    print_info(f"Uploading public key to {ip} (please enter password manually)...")
+    ret, out, err = run_command(["ssh-copy-id", "-i", str(LOCAL_SSH_KEY), f"root@{ip}"])
+
+    if ret != 0:
+        print_error(f"Failed to upload public key: {err}")
+        return False
+
+    # Verify passwordless SSH login
+    if check_ssh_login(ip):
+        print_info(f"Passwordless SSH login configured successfully for {ip}!")
+    else:
+        print_error(
+            f"Failed to verify passwordless SSH login for {ip}. "
+            "Please check network connectivity, SSH service, or user permissions."
+        )
+        # sys.exit(1)
+        return False
+
+
+def run_set_ssh_login() -> Dict[str, Any]:
+    """
+    Configure passwordless SSH login for master and worker nodes.
+
+    This function checks and sets up SSH key-based authentication
+    for the master and worker nodes defined via environment variables.
+
+    Returns:
+        A dictionary containing the configuration status for each node,
+        along with a global success flag.
+
+        Example structure:
+        {
+            "MASTER_IP": {
+                "ip": "192.168.1.1",
+                "status": True,
+            },
+            "WORKER_IP": {
+                "ip": "192.168.1.2",
+                "status": False,
+            },
+            "SSH_CHECK": True  # Overall success status
+        }
+    """
+    print("\n" + "-" * 40 + "\n")
+    print("Configuring passwordless SSH login for remote hosts")
+
+    results: Dict[str, Dict[str, Any]] = {}
+    all_success = True  # Track overall operation success
+
+    # Build IP mapping
+    ip_map: Dict[str, Optional[str]] = {"MASTER_IP": MASTER_IP}
+    if WORKER_IP:
+        ip_map["WORKER_IP"] = WORKER_IP
+
+    # Process each target host
+    for key, ip in ip_map.items():
+        if not ip:
+            result = {
+                "ip": "",
+                "status": False,
+            }
+            results[key] = result
+            all_success = False
+            continue
+
+        result = {
+            "ip": ip,
+            "status": False,
+        }
+
+        print(f"\nProcessing IP: {ip}")
+
+        try:
+            # Step 1: Check if passwordless SSH is already working
+            if check_ssh_login(ip):
+                result["status"] = True
+                print_info(f"{ip} - Passwordless login already available")
+            else:
+                # Step 2: Set up SSH key (will prompt for password)
+                print_info(f"Setting up SSH key for {ip}...")
+                setup_ssh_key(ip)
+
+                # Step 3: Re-check after setup
+                if check_ssh_login(ip):
+                    result["status"] = True
+                else:
+                    result["status"] = False
+
+        except Exception as e:
+            result["status"] = False
+            print_error(f"Error processing {ip}: {e}")
+
+        # Update overall success flag
+        if not result["status"]:
+            all_success = False
+
+        results[key] = result
+
+    # Final global success indicator
+    results["SSH_CHECK"] = all_success
+
+    return results
+
+
+def run_remote(ip, script, env=None, raise_on_error=True):
+    """
+    Execute a Bash script remotely via SSH, print output in real-time,
+    and return the full output.
+
+    Args:
+        ip (str): Remote host IP address
+        script (str): Bash script content to execute
+        env (dict, optional): Environment variables to set before execution
+        raise_on_error (bool): Whether to raise an exception if remote command fails
+
+    Returns:
+        str: Full output of the executed script
+
+    Raises:
+        Exception: If the remote command fails and raise_on_error=True
+    """
+    exports = ""
+    if env:
+        for k, v in env.items():
+            exports += f'export {k}="{v}"\n'
+
+    # Start SSH process with bash -s
+    process = subprocess.Popen(
+        ["ssh", "-q", "-i", str(LOCAL_SSH_KEY), f"root@{ip}", "bash", "-s"],
+        stdin=subprocess.PIPE,
+        stdout=subprocess.PIPE,
+        stderr=subprocess.STDOUT,
+        text=True,
+    )
+
+    # Send environment exports and script
+    process.stdin.write(exports + "\n" + script + "\n")
+    process.stdin.close()
+
+    # Read and print output line by line in real-time
+    output_lines = []
+    for line in process.stdout:
+        print(line, end="")  # 实时打印
+        output_lines.append(line)
+
+    process.wait()
+    full_output = "".join(output_lines)
+
+    return full_output
+
+
+def parse_hccn_output(output):
+    """
+    Parse output from both HCCN (Ascend) and NVIDIA styles and unify the result.
+    Unified output format: { item: {status: bool, output: str}}
+    """
+    result_dict = {}
+
+    current_item = None
+    current_lines = []
+
+    for raw_line in output.splitlines():
+        line = raw_line.strip()
+
+        # ========== Ascend ==========
+        # Start Detection：xxx
+        if line.startswith("Start Detection："):
+            current_item = line.replace("Start Detection：", "").strip()
+            current_lines = []
+            continue
+
+        # [RESULT] xxx: Success/Failed
+        if line.startswith("[RESULT]"):
+            if current_item:
+                status_str = line.split(":", 1)[1].strip()
+                passed = status_str.startswith("Success")
+
+                result_dict[current_item] = {
+                    "status": passed,
+                    "output": "\n".join(current_lines).strip(),
+                }
+
+                current_item = None
+                current_lines = []
+            continue
+
+        # ========== NVIDIA ==========
+        # [Detection] xxx
+        if line.startswith("[Detection]"):
+            current_item = line.replace("[Detection]", "").strip()
+            current_lines = []
+            continue
+
+        # Pass：xxx
+        if line.startswith("Pass："):
+            item = line.replace("Pass：", "").strip()
+
+            result_dict[item] = {
+                "status": True,
+                "output": "\n".join(current_lines).strip(),
+            }
+
+            current_item = None
+            current_lines = []
+            continue
+
+        # Failed：xxx
+        if line.startswith("Failed："):
+            item = line.replace("Failed：", "").strip()
+
+            result_dict[item] = {
+                "status": False,
+                "output": "\n".join(current_lines).strip(),
+            }
+
+            current_item = None
+            current_lines = []
+            continue
+
+        if current_item:
+            current_lines.append(line)
+
+    return result_dict
+
+
+def run_hccn_device_status_check():
+    """
+    Run a series of HCCN (Huawei Cloud Computing Network) device status checks
+    on the target node via remote execution. This includes checking link neighbors,
+    physical link status, network health, IP configuration, and gateway settings
+    for all Ascend AI accelerators.
+
+    The function uses the 'hccn_tool' command-line utility to query device information
+    and verifies the health and connectivity of the Ascend cards in the system.
+
+    Returns:
+        dict: A dictionary containing the result of each check, parsed from the output.
+    """
+    HCCN_STATUS_CHECK_SCRIPT = r"""
+run_check() {
+    cmd="$1"
+    desc="$2"
+    echo "Start Detection：$desc"
+    if eval "$cmd"; then
+        echo "[RESULT] $desc: Success"
+        return 0
+    else
+        echo "[RESULT] $desc: Failed (code=$?)" >&2
+        return 1
+    fi
+}
+
+run_check "for i in $(echo \"$ASCEND_RT_VISIBLE_DEVICES\" | tr ',' ' ' | xargs); do hccn_tool -i \$i -lldp -g | grep Ifname; done" "link_neighbor_status"
+run_check "for i in $(echo \"$ASCEND_RT_VISIBLE_DEVICES\" | tr ',' ' ' | xargs); do hccn_tool -i \$i -link -g; done" "physical_link_status"
+run_check "for i in $(echo \"$ASCEND_RT_VISIBLE_DEVICES\" | tr ',' ' ' | xargs); do hccn_tool -i \$i -net_health -g; done" "network_health_status"
+run_check "for i in $(echo \"$ASCEND_RT_VISIBLE_DEVICES\" | tr ',' ' ' | xargs); do hccn_tool -i \$i -ip -g; done" "gpu_ip_config"
+run_check "for i in $(echo \"$ASCEND_RT_VISIBLE_DEVICES\" | tr ',' ' ' | xargs); do hccn_tool -i \$i -gateway -g; done" "gateway_config"
+"""
+    print("\n----------------------------------------\n")
+    print(f"[UC] Starting to check the Ascend card status, node IP: {MASTER_IP}")
+    os.environ["ASCEND_RT_VISIBLE_DEVICES"] = ASCEND_RT_VISIBLE_DEVICES
+    output = run_remote(
+        MASTER_IP,
+        HCCN_STATUS_CHECK_SCRIPT,
+        env={"ASCEND_RT_VISIBLE_DEVICES": ASCEND_RT_VISIBLE_DEVICES},
+    )
+
+    # Parsing Output
+    result_dict = parse_hccn_output(output)
+
+    return result_dict
+
+
+def run_nvidia_device_status_check():
+    """
+    Execute a comprehensive set of NVIDIA GPU device status checks
+    on the target node via remote execution. This includes verifying:
+    - Driver loading,
+    - GPU device detection,
+    - GPU temperature (<85°C),
+    - Physical link status (PCIe) for each GPU,
+    - Full interconnection topology (using 'nvidia-smi topo -m'),
+    - CUDA compiler availability and version.
+
+    The script uses standard NVIDIA tools like 'nvidia-smi', 'lsmod', and 'nvcc'
+    to validate the health and configuration of the GPU system.
+
+    Returns:
+        dict: A dictionary containing the result of each check, parsed from the output.
+    """
+    NVIDIA_STATUS_CHECK_SCRIPT = r"""
+run_check() {
+    cmd="$1"
+    desc="$2"
+    echo "[Detection] $desc"
+    if eval "$cmd"; then
+        echo "Pass：$desc"
+        return 0
+    else
+        echo "Failed：$desc (code=$?)" >&2
+        return 1
+    fi
+}
+
+run_check "lsmod | grep -q nvidia" "Check the driver loading"
+run_check "nvidia-smi -L | grep -q GPU" "Checking the Device List"
+run_check "nvidia-smi -q | awk '/GPU Current Temp/ && \$6!=\"N/A\" {exit \$4>85?1:0}'" "Check temperature (<85°C)"
+
+GPU_COUNT=$(nvidia-smi -L | wc -l)
+
+for i in $(seq 0 $((GPU_COUNT-1))); do
+    run_check "nvidia-smi -i $i -q | grep -q 'GPU Link Info'" "Check the physical link information of GPU$i" "WARN"
+done
+
+run_check "nvidia-smi topo -m | awk 'BEGIN{all_ok=1} /^GPU/ {for(i=2;i<=NF;i++) if($i==\"-\") all_ok=0} END{exit !all_ok}'" "Check full card interconnection" "WARN"
+run_check "nvcc --version | grep -q 'release'" "CUDA version"
+"""
+    print("\n----------------------------------------\n")
+    print(f"[UC] Starting to check the NVIDIA card status, node IP: {MASTER_IP}")
+    output = run_remote(MASTER_IP, NVIDIA_STATUS_CHECK_SCRIPT)
+
+    # Parsing Output
+    result_dict = parse_hccn_output(output)
+
+    return result_dict
+
+
+def get_remote_card_ips(ip: str, card_ids: str):
+    remote_cmd = f"""
+tool="/usr/local/Ascend/driver/tools/hccn_tool"
+IFS=',' read -ra card_array <<< "{card_ids}"
+declare -a ips
+for card_id in "${{card_array[@]}}"; do
+    output=$("$tool" -i "$card_id" -ip -g 2>/dev/null)
+    ip=$(echo "$output" | grep -oP "ipaddr:\\K[\\d.]+" || echo "")
+    [ -n "$ip" ] && ips+=("$ip")
+done
+printf "%s\\n" "${{ips[@]}}" | sort -V
+"""
+    try:
+        result = subprocess.run(
+            f"ssh -i \"{str(LOCAL_SSH_KEY)}\" root@{ip} bash -c '{remote_cmd}'",
+            shell=True,
+            capture_output=True,
+            text=True,
+            check=True,
+        )
+
+        return result.stdout.strip().splitlines()
+    except subprocess.CalledProcessError:
+        print(f"Failed to get NPU card IPs on remote machine {ip}", file=sys.stderr)
+        sys.exit(1)
+
+
+def remote_hccn_card_ping_test(ip: str, card_ids: str):
+    """
+    Execute HCCN card intra-node ping test on a remote machine (SSH + execution + structured results)
+    :param ip: remote machine IP
+    :param card_ids: list of card IDs, e.g., "0,1,2,3"
+    :return: result_dict
+    """
+
+    remote_cmd = f"""
+function intra_node_hccn_card_ping_test() {{
+    IFS=',' read -ra card_array <<< "{card_ids}"
+    declare -A card_ip_map
+
+    tool="/usr/local/Ascend/driver/tools/hccn_tool"
+
+    echo "[INFO] Retrieving HCCN card IPs..."
+
+    # Step 1: get IP address for each card
+    for card_id in "${{card_array[@]}}"; do
+        output=$("$tool" -i "$card_id" -ip -g 2>/dev/null)
+        ip=$(echo "$output" | grep -oP "ipaddr:\\K[\\d.]+" || echo "")
+        if [ -n "$ip" ]; then
+            card_ip_map[$card_id]="$ip"
+        else
+            echo "[RESULT] card_$card_id: Failed to get IP"
+        fi
+    done
+
+    if [ ${{#card_ip_map[@]}} -eq 0 ]; then
+        echo "[FATAL] No HCCN card IPs detected"
+        return
+    fi
+
+    echo "[INFO] Retrieved card IP mapping:"
+    for k in "${{!card_ip_map[@]}}"; do
+        echo "  Card $k -> ${{card_ip_map[$k]}}"
+    done
+
+    # Step 2: ping test between HCCN cards
+    for src_id in "${{!card_ip_map[@]}}"; do
+        for dst_id in "${{!card_ip_map[@]}}"; do
+            if [ "$src_id" != "$dst_id" ]; then
+                pair="local_card_${{src_id}} to local_card_${{dst_id}}"
+                dst_ip="${{card_ip_map[$dst_id]}}"
+
+                echo "[TEST] $pair ($dst_ip)"
+
+                if "$tool" -i "$src_id" -ping -g address "$dst_ip" >/dev/null 2>&1; then
+                    echo "[RESULT] $pair: Success"
+                else
+                    echo "[RESULT] $pair: Failed"
+                fi
+            fi
+        done
+    done
+}}
+
+intra_node_hccn_card_ping_test
+"""
+
+    print(f"\n[INFO] Start Detection {ip} HCCN card intra-node Ping...")
+
+    escaped_cmd = shlex.quote(remote_cmd)
+
+    ssh_cmd = [
+        "ssh",
+        "-q",
+        "-o",
+        "LogLevel=ERROR",
+        "-o",
+        "StrictHostKeyChecking=no",
+        "-o",
+        "UserKnownHostsFile=/dev/null",
+        "-i",
+        str(LOCAL_SSH_KEY),
+        f"root@{ip}",
+        "bash",
+        "-c",
+        escaped_cmd,
+    ]
+
+    process = subprocess.Popen(
+        ssh_cmd, stdout=subprocess.PIPE, stderr=subprocess.STDOUT, text=True, bufsize=1
+    )
+
+    output_lines = []
+    for line in process.stdout:
+        print(line, end="")
+        output_lines.append(line.strip())
+
+    process.wait()
+
+    result_dict = {}
+
+    for line in output_lines:
+        if line.startswith("[RESULT]"):
+            line = line.replace("[RESULT]", "").strip()
+            key, status_part = line.split(":", 1)
+            status = status_part.strip().startswith("Success")
+
+            result_dict[key.strip()] = {"status": status, "output": ""}
+
+    return result_dict
+
+
+def remote_local_hccn_cards_ping_test(
+    src_type: str, src_ip: str, src_card: str, dst_ip: str
+):
+    """
+    Local or remote HCCN card ping test, return unified result_dict
+    :param src_type: "local" or "remote"
+    :param src_ip: remote machine IP (if src_type=="remote")
+    :param src_card: source card ID
+    :param dst_ip: destination IP
+    :return: dict -> { "card_X_to_card_Y": {"status": True/False, "output": "..."}, "global_status": {...} }
+    """
+    if src_type == "local":
+        print(f"[TEST] LOCAL card {src_card} → REMOTE {dst_ip}")
+        pair_key = f"local_card_{src_card} to remote_{dst_ip.replace('.', '_')}"
+        cmd = f"hccn_tool -i {src_card} -ping -g address {dst_ip}"
+    else:
+        print(f"[TEST] REMOTE {src_ip} card {src_card} → LOCAL {dst_ip}")
+        pair_key = f"remote_card_{src_card} to local_{dst_ip.replace('.', '_')}"
+        cmd = f'ssh -i "{str(LOCAL_SSH_KEY)}" root@{src_ip} hccn_tool -i {src_card} -ping -g address {dst_ip}'
+
+    result_dict = {pair_key: {"status": False, "output": ""}}
+    try:
+        completed = subprocess.run(cmd, shell=True, capture_output=True, text=True)
+        if completed.returncode == 0 and src_type == "local":
+            print(f"[RESULT] LOCAL card {src_card} → REMOTE {dst_ip}: Success")
+        elif completed.returncode == 0 and src_type == "remote":
+            print(f"[RESULT] REMOTE {src_ip} card {src_card} → LOCAL {dst_ip}: Success")
+        elif src_type == "local":
+            print(f"[RESULT] LOCAL card {src_card} → REMOTE {dst_ip}: Failed")
+        elif src_type == "remote":
+            print(f"[RESULT] REMOTE {src_ip} card {src_card} → LOCAL {dst_ip}: Failed")
+
+        result_dict[pair_key]["status"] = completed.returncode == 0
+
+    except Exception as e:
+        result_dict[pair_key]["status"] = False
+
+    # Calculate global status (only one ping here, caller can aggregate multiple pings)
+    result_dict["global_status"] = {
+        "status": result_dict[pair_key]["status"],
+        "output": "HCCN local/remote ping global status",
+    }
+
+    return result_dict
+
+
+def run_check_hccn_ping():
+    """
+    Execute HCCN card ping test including master intra-node ping, local<->remote ping, and remote inter-node ping.
+    Returns unified result_dict with global status.
+    """
+    # ASCEND_RT_VISIBLE_DEVICES = os.environ.get("ASCEND_RT_VISIBLE_DEVICES", "")
+
+    print("\n----------------------------------------\n")
+    print("[UC] start check HCCN ping. Please ensure running at master machine.")
+
+    all_results = {}
+
+    # Get master node card IP list
+    local_card_ips = get_remote_card_ips(MASTER_IP, ASCEND_RT_VISIBLE_DEVICES)
+    remote_machines = WORKER_IP.split(",") if WORKER_IP else []
+
+    # 1. Master node intra-card ping
+    master_result = remote_hccn_card_ping_test(MASTER_IP, ASCEND_RT_VISIBLE_DEVICES)
+    all_results.update(master_result)
+
+    # 2. Local <-> Remote node ping
+    if NODE_NUM > 1:
+        print("\n[INFO] === Local <-> Remote node ping test ===")
+        for remote_ip in remote_machines:
+            remote_card_ips = get_remote_card_ips(remote_ip, ASCEND_RT_VISIBLE_DEVICES)
+
+            # Local ping remote
+            print(f"[INFO] Master node card ping remote node {remote_ip} ...")
+            for local_idx, local_ip in enumerate(local_card_ips):
+                for remote_card_ip in remote_card_ips:
+                    res = remote_local_hccn_cards_ping_test(
+                        "local", "", local_idx, remote_card_ip
+                    )
+                    all_results.update(res)
+
+            # Remote ping local
+            print(f"[INFO] Remote node {remote_ip} card ping Master node ...")
+            for remote_idx, remote_card_ip in enumerate(remote_card_ips):
+                for local_ip_card in local_card_ips:
+                    res = remote_local_hccn_cards_ping_test(
+                        "remote", remote_ip, remote_idx, local_ip_card
+                    )
+                    all_results.update(res)
+
+    # 3. Remote inter-node ping
+    if len(remote_machines) > 1:
+        print("\n[INFO] === Remote inter-node ping test ===")
+        for i in range(len(remote_machines)):
+            for j in range(i + 1, len(remote_machines)):
+                ip1, ip2 = remote_machines[i], remote_machines[j]
+                ips1 = get_remote_card_ips(ip1, ASCEND_RT_VISIBLE_DEVICES)
+                ips2 = get_remote_card_ips(ip2, ASCEND_RT_VISIBLE_DEVICES)
+
+                # ip1 -> ip2
+                print(f"[INFO] Node {ip1} ping Node {ip2} ...")
+                for idx1, card1_ip in enumerate(ips1):
+                    for card2_ip in ips2:
+                        res = remote_local_hccn_cards_ping_test(
+                            "remote", ip1, idx1, card2_ip
+                        )
+                        all_results.update(res)
+
+                # ip2 -> ip1
+                print(f"[INFO] Node {ip2} ping Node {ip1} ...")
+                for idx2, card2_ip in enumerate(ips2):
+                    for card1_ip in ips1:
+                        res = remote_local_hccn_cards_ping_test(
+                            "remote", ip2, idx2, card1_ip
+                        )
+                        all_results.update(res)
+
+    # Calculate global status
+    global_status = all(
+        r["status"] for k, r in all_results.items() if k != "global_status"
+    )
+    all_results["hccn_ping_check"] = {"status": global_status}
+
+    return all_results
+
+
+def run_check_nvidia_ping():
+    """
+    Master <-> Worker ping test in multi-node environment
+    :return: result_dict -> { "master->WORKER_IP": {"status": True/False, "output": "..."},
+                               "WORKER_IP->master": {...}, "global_status": True/False }
+    """
+    print("\n----------------------------------------\n")
+    print("[UC] start check NVIDIA ping. Please ensure running at master machine.\n")
+
+    remote_machines = WORKER_IP.split(",") if WORKER_IP else []
+    result_dict = {}
+
+    if NODE_NUM > 1:
+        print(
+            "--------------------------NVIDIA multi-node environment: test ping between nodes -----------------------------\n"
+        )
+
+        for remote_ip in remote_machines:
+            # master -> worker
+            pair_key = f"master {MASTER_IP}-> worker {remote_ip}"
+            print(f"Testing ping: master {MASTER_IP} --> worker {remote_ip}")
+            ping_cmd = f"ping -c 4 -W 1 {remote_ip}"
+            completed = subprocess.run(
+                ping_cmd, shell=True, capture_output=True, text=True
+            )
+            output_text = (
+                (completed.stdout or "").strip()
+                + "\n"
+                + (completed.stderr or "").strip()
+            )
+            status = completed.returncode == 0
+            result_dict[pair_key] = {
+                "status": status,
+                "output": output_text if status else f"Failed\n{output_text}",
+            }
+            print(f"{pair_key} {'Ping OK' if status else 'Ping Failed'}\n")
+
+            # worker -> master
+            pair_key = f"worker {remote_ip}-> master {MASTER_IP}"
+            print(f"Testing ping: worker {remote_ip} --> master {MASTER_IP}")
+            ssh_ping_cmd = (
+                f"ssh -q -o StrictHostKeyChecking=no -o UserKnownHostsFile=/dev/null "
+                f'-o LogLevel=ERROR -o ConnectTimeout=5 -i "{str(LOCAL_SSH_KEY)}" '
+                f'root@{remote_ip} "ping -c 4 -W 1 {MASTER_IP}"'
+            )
+            completed = subprocess.run(
+                ssh_ping_cmd, shell=True, capture_output=True, text=True
+            )
+            output_text = (
+                (completed.stdout or "").strip()
+                + "\n"
+                + (completed.stderr or "").strip()
+            )
+            status = completed.returncode == 0
+            result_dict[pair_key] = {
+                "status": status,
+            }
+            print(f"{pair_key} {'Ping OK' if status else 'Ping Failed'}\n")
+
+    # Calculate global status
+    global_status = (
+        all(v["status"] for v in result_dict.values()) if result_dict else True
+    )
+    result_dict["nvidia_ping_check"] = {"status": global_status}
+
+    return result_dict
+
+
+def run_hccn_tls_check(MASTER_IP: str, WORKER_IP: str) -> Dict[str, Any]:
+    """
+    Check whether the TLS switch of all HCCN cards on master and worker nodes is 0.
+    Card IDs are read from the ASCEND_RT_VISIBLE_DEVICES environment variable, e.g., "0,1".
+
+    Return format:
+    {
+        "tls_check": {
+            "status": True/False,
+            "master_card_0": {"card_id": "0", "status": True},
+            "master_card_1": {"card_id": "1", "status": False},
+            "worker_card_0": {"card_id": "0", "status": True},
+            ...
+        }
+    }
+    """
+
+    global TLS_CHECK_RESULT
+    TLS_CHECK_RESULT = True
+
+    print("\n----------------------------------------\n")
+    print(f"[UC] Starting to check the HCCN card TLS status")
+    devices = ASCEND_RT_VISIBLE_DEVICES
+    if not devices:
+        raise EnvironmentError(
+            "Environment variable ASCEND_RT_VISIBLE_DEVICES is not set"
+        )
+
+    card_ids = [c.strip() for c in devices.split(",") if c.strip()]
+    if not card_ids:
+        raise ValueError(f"Failed to parse ASCEND_RT_VISIBLE_DEVICES: {devices}")
+
+    result: Dict[str, Any] = {"tls_check": {"status": True}}
+
+    def check_node(node_ip: str, node_prefix: str):
+        """
+        Check TLS switch status on a single node for all HCCN cards.
+        """
+        global TLS_CHECK_RESULT
+        if not node_ip:
+            return
+
+        for card_id in card_ids:
+            # Construct SSH command
+            print(f"[TEST] {node_prefix}_card_{card_id} ({node_ip}) TLS checking...")
+            cmd = (
+                f"ssh -i {str(LOCAL_SSH_KEY)} -q -o LogLevel=ERROR -o StrictHostKeyChecking=no -o UserKnownHostsFile=/dev/null root@{node_ip} "
+                f"'{shlex.quote(f'/usr/local/Ascend/driver/tools/hccn_tool -i {card_id} -tls -g | head -n 1')}'"
+            )
+
+            try:
+                output = subprocess.check_output(
+                    cmd, shell=True, text=True, stderr=subprocess.DEVNULL
+                ).strip()
+            except subprocess.CalledProcessError:
+                status = False
+            else:
+                # Extract TLS switch value from the first line
+                import re
+
+                match = re.search(r"tls switch\[(\d+)\]", output)
+                if match and match.group(1) == "0":
+                    status = True
+                else:
+                    status = False
+
+            key = f"{node_prefix}_card_{card_id}"
+            result["tls_check"][key] = {"card_id": card_id, "status": status}
+
+            if status:
+                print(f"[RESULT] {node_prefix}_card_{card_id}: PASS (switch=0)")
+            else:
+                print(f"[RESULT] {node_prefix}_card_{card_id}: FAIL")
+                TLS_CHECK_RESULT = False
+
+    # Check master node
+    check_node(MASTER_IP, "master")
+    # Check worker node
+    check_node(WORKER_IP, "worker")
+
+    result["tls_check"]["status"] = TLS_CHECK_RESULT
+    return result
+
+
+MODEL_WEIGHT_FILES_LIST = []
+
+
+def get_llm_weight_files_list(MODEL_PATH, result_dict):
+    global MODEL_WEIGHT_FILES_LIST
+    result_dict["get_llm_weight_files_list"] = {"status": False, "output": ""}
+
+    print(f"[UC] Get LLM weight files list: {MODEL_PATH}")
+
+    if not os.path.isdir(MODEL_PATH):
+        msg = f"Directory does not exist: {MODEL_PATH}"
+        print(msg, file=sys.stderr)
+        result_dict["get_llm_weight_files_list"]["output"] = msg
+        return result_dict
+
+    os.chdir(MODEL_PATH)
+
+    print("\nSearching for all .safetensors files...")
+    MODEL_WEIGHT_FILES_LIST = [
+        f for f in os.listdir(".") if f.endswith(".safetensors") and os.path.isfile(f)
+    ]
+
+    print(f"Found {len(MODEL_WEIGHT_FILES_LIST)} files")
+
+    if len(MODEL_WEIGHT_FILES_LIST) == 0:
+        msg = f"No weight files found in {MODEL_PATH}"
+        print(msg, file=sys.stderr)
+        result_dict["get_llm_weight_files_list"]["output"] = msg
+        return result_dict
+
+    if len(MODEL_WEIGHT_FILES_LIST) > 1:
+        # Extract N-of-M pattern from filenames
+        total_chunks_from_names = 0
+        for f in MODEL_WEIGHT_FILES_LIST:
+            match = re.search(r"(\d+)-of-(\d+)", f)
+            if match:
+                total_chunks_from_names = int(match.group(2).lstrip("0") or 0)
+                break
+
+        actual_file_count = len(MODEL_WEIGHT_FILES_LIST)
+
+        if total_chunks_from_names == actual_file_count:
+            print(
+                f"Validation passed: Total chunks in filenames ({total_chunks_from_names}) matches actual count ({actual_file_count})"
+            )
+        else:
+            msg = (
+                f"Validation failed: Total chunks in filenames {total_chunks_from_names}, "
+                f"but actually found {actual_file_count} files"
+            )
+            print(msg, file=sys.stderr)
+            result_dict["get_llm_weight_files_list"]["output"] = msg
+            return result_dict
+
+    result_dict["get_llm_weight_files_list"]["status"] = True
+    return result_dict
+
+
+def get_weight_files_hash(MODEL_PATH, HF_MODEL_NAME, MIDDLE_PAGE, result_dict):
+    result_dict["get_weight_files_hash"] = {"status": False, "output": ""}
+
+    output_path = os.path.join(MODEL_PATH, f"{HF_MODEL_NAME}.sha256")
+
+    if not os.path.exists(output_path):
+        print(
+            "Weight hash file does not exist, retrieving from HuggingFace. Ensure internet access!"
+        )
+
+        for file in MODEL_WEIGHT_FILES_LIST:
+            weight_file = file.replace("./", "")
+            page = f"https://huggingface.co/{MIDDLE_PAGE}/{HF_MODEL_NAME}/blob/main/{weight_file}"
+
+            max_retry = 3
+            retry_delay = 2
+            hash_value = ""
+
+            for i in range(1, max_retry + 1):
+                try:
+                    cmd = (
+                        f'curl -fsSL -k --connect-timeout 10 "{page}" | '
+                        r'grep -oE "[a-f0-9]{64}" | head -n 1'
+                    )
+                    result = subprocess.check_output(
+                        cmd, shell=True, stderr=subprocess.DEVNULL
+                    )
+                    hash_value = result.decode().strip()
+
+                    if re.fullmatch(r"[a-f0-9]{64}", hash_value):
+                        break
+
+                    if i < max_retry:
+                        print(f"Request failed, retry {i}...", file=sys.stderr)
+                        time.sleep(retry_delay)
+
+                except subprocess.CalledProcessError:
+                    pass
+
+            if not re.fullmatch(r"[a-f0-9]{64}", hash_value):
+                msg = f"Cannot get valid hash: {weight_file}"
+                print(msg, file=sys.stderr)
+                result_dict["get_weight_files_hash"]["output"] = msg
+                return result_dict
+
+            with open(output_path, "a", encoding="utf-8") as f:
+                f.write(f"{hash_value}  {file}\n")
+
+    else:
+        print(f"{output_path} already exists")
+
+    result_dict["get_weight_files_hash"]["status"] = True
+    return result_dict
+
+
+def run_check_model_weight():
+    result_dict = {}
+
+    print("\n----------------------------------------\n")
+    print(f"[UC] Check model weight: {MODEL_PATH}")
+
+    # Step 1: Get model files list
+    result_dict = get_llm_weight_files_list(MODEL_PATH, result_dict)
+
+    # Step 2: Get HuggingFace hash
+    if result_dict.get("get_llm_weight_files_list", {}).get("status"):
+        result_dict = get_weight_files_hash(
+            MODEL_PATH, HF_MODEL_NAME, MIDDLE_PAGE, result_dict
+        )
+    else:
+        result_dict["global_status"] = {"status": False}
+        return result_dict
+
+    # Step 3: Verify sha256
+    result_dict["sha256_verification"] = {"status": False, "output": ""}
+    os.chdir(MODEL_PATH)
+    sha256_files = [f for f in os.listdir(".") if f.endswith(".sha256")]
+
+    if len(sha256_files) == 0:
+        msg = "Error: No .sha256 files found"
+        print(msg, file=sys.stderr)
+        result_dict["sha256_verification"]["output"] = msg
+    elif len(sha256_files) > 1:
+        msg = f"Error: Multiple .sha256 files found: {sha256_files}"
+        print(msg, file=sys.stderr)
+        result_dict["sha256_verification"]["output"] = msg
+    else:
+        sha256_file = sha256_files[0]
+        try:
+            subprocess.check_call(f"sha256sum -c {sha256_file}", shell=True)
+            print("All .safetensors files verified successfully")
+            result_dict["sha256_verification"]["status"] = True
+        except subprocess.CalledProcessError:
+            msg = "Model weight verification failed, exiting"
+            print(msg, file=sys.stderr)
+            result_dict["sha256_verification"]["output"] = msg
+
+    # Calculate global status
+    global_status = all(v.get("status", False) for k, v in result_dict.items())
+    result_dict["model_weight_check"] = {"status": global_status}
+
+    return result_dict
+
+
+class StdoutInterceptor:
+    """
+    Intercepts all stdout and stderr output from both C++ and Python code,
+    and prevents it from being printed directly to the console.
+
+    This is useful for capturing logs programmatically for filtering or analysis.
+    """
+
+    def __enter__(self):
+        # Save original stdout and stderr file descriptors
+        self.original_stdout = os.dup(1)
+        self.original_stderr = os.dup(2)
+
+        # Create a pipe to capture output
+        self.pipe_out_r, self.pipe_out_w = os.pipe()
+
+        # Redirect stdout and stderr to the pipe
+        os.dup2(self.pipe_out_w, 1)
+        os.dup2(self.pipe_out_w, 2)
+        os.close(self.pipe_out_w)
+
+        self.logs = []
+        self._stop_thread = False
+
+        # Start a background thread to read from the pipe continuously
+        self.thread = threading.Thread(target=self._read_pipe)
+        self.thread.daemon = True
+        self.thread.start()
+        return self
+
+    def _read_pipe(self):
+        # Continuously read from the pipe until stopped
+        while not self._stop_thread:
+            try:
+                chunk = os.read(self.pipe_out_r, 4096)
+                if chunk:
+                    text = chunk.decode()
+                    self.logs.append(text)
+                    # Do not print to terminal; logs are kept internally
+                else:
+                    time.sleep(0.01)
+            except OSError:
+                break
+
+    def __exit__(self, exc_type, exc_val, exc_tb):
+        # Stop background thread and restore stdout/stderr
+        self._stop_thread = True
+        time.sleep(0.05)
+        try:
+            os.close(self.pipe_out_r)
+        except OSError:
+            pass
+        os.dup2(self.original_stdout, 1)
+        os.dup2(self.original_stderr, 2)
+        os.close(self.original_stdout)
+        os.close(self.original_stderr)
+
+    def read(self):
+        """Return all captured logs as a single string."""
+        return "".join(self.logs)
+
+
+def setup_uc(block_size):
+    """
+    Initialize UC (Unified Cache) with a given block size.
+
+    Args:
+        block_size (int): Total block size in bytes for UC setup.
+
+    Raises:
+        RuntimeError: if ucmstore.Setup returns a non-zero value.
+    """
+    param = ucmstore.SetupParam(STORAGE_BACKENDS, block_size, True)
+    ret = ucmstore.Setup(param)
+    if ret != 0:
+        raise RuntimeError(f"ucmstore.Setup failed: ret={ret}")
+
+
+def filter_task_logs(logs):
+    """
+    Filter UC output logs to extract only lines containing Task information,
+    including task_id and bandwidth.
+
+    Args:
+        logs (str): Raw UC logs.
+
+    Returns:
+        str: Filtered log lines, suitable for printing.
+    """
+    filtered_lines = []
+    for line in logs.splitlines():
+        m = re.search(r"(Task\(\d+,[^\)]*\).*?bw=[\d\.]+GB/s)", line)
+        if m:
+            filtered_lines.append(m.group(1))
+    return "\n".join(filtered_lines)
+
+
+def embed(hashes, block_layer_size, block_layer):
+    """
+    Execute UC embedding (writing KVCache blocks) operation and measure bandwidth.
+
+    Args:
+        hashes (list[str]): List of block hashes to embed.
+        block_layer_size (int): Size of each block layer in bytes.
+        block_layer (int): Number of layers per block.
+
+    Returns:
+        float | None: Average bandwidth in GB/s, or None if no valid bw found.
+
+    Raises:
+        RuntimeError: If any UC operation fails.
+    """
+    with StdoutInterceptor() as cap:
+        # Allocate blocks in UC
+        ret = ucmstore.AllocBatch(hashes)
+        if sum(ret) != 0:
+            raise RuntimeError(f"ucmstore.AllocBatch failed: sum(ret)={sum(ret)} != 0")
+
+        block_number = len(hashes)
+        buffers = ucmstore.MakeHostBuffers(block_layer_size, block_layer * block_number)
+        if len(buffers) == 0:
+            raise RuntimeError("ucmstore.MakeHostBuffers failed: no buffers allocated")
+
+        # Prepare data for DumpFromHost
+        data_id, data_off, data_addr, data_len = [], [], [], []
+        for block_idx in range(block_number):
+            offset = 0
+            for layer_idx in range(block_layer):
+                data_id.append(hashes[block_idx])
+                data_off.append(offset)
+                data_addr.append(buffers[block_idx * block_layer + layer_idx])
+                data_len.append(block_layer_size)
+                offset += block_layer_size
+
+        # Dump data to UC
+        task_id = ucmstore.DumpFromHost(data_id, data_off, data_addr, data_len)
+        if task_id <= 0:
+            raise RuntimeError(
+                f"ucmstore.DumpFromHost failed: invalid task_id={task_id}"
+            )
+
+        # Wait for completion
+        ret = ucmstore.Wait(task_id)
+        if ret != 0:
+            raise RuntimeError(
+                f"ucmstore.Wait failed for embed task_id={task_id}, ret={ret}"
+            )
+
+        # Release host buffers and commit
+        ucmstore.ReleaseHostBuffers(buffers)
+        ucmstore.CommitBatch(hashes, True)
+
+    logs = cap.read()
+    print(filter_task_logs(logs))
+
+    # Extract average bandwidth
+    bw_list = [float(x) for x in re.findall(r"bw=([\d\.]+)GB/s", logs)]
+    avg_bw = sum(bw_list) / len(bw_list) if bw_list else None
+    return avg_bw
+
+
+def fetch(hashes, block_layer_size, block_layer):
+    """
+    Execute UC fetching (reading KVCache blocks) operation and measure bandwidth.
+
+    Args:
+        hashes (list[str]): List of block hashes to fetch.
+        block_layer_size (int): Size of each block layer in bytes.
+        block_layer (int): Number of layers per block.
+
+    Returns:
+        float | None: Average bandwidth in GB/s, or None if no valid bw found.
+
+    Raises:
+        RuntimeError: If any UC operation fails.
+    """
+    with StdoutInterceptor() as cap:
+        block_number = len(hashes)
+        results = ucmstore.LookupBatch(hashes)
+        if not all(results):
+            raise RuntimeError("ucmstore.LookupBatch failed: some blocks not found")
+
+        buffers = ucmstore.MakeHostBuffers(block_layer_size, block_layer * block_number)
+        if len(buffers) == 0:
+            raise RuntimeError("ucmstore.MakeHostBuffers failed: no buffers allocated")
+
+        # Prepare data for LoadToHost
+        data_id, data_off, data_addr, data_len = [], [], [], []
+        for block_idx in range(block_number):
+            offset = 0
+            for layer_idx in range(block_layer):
+                data_id.append(hashes[block_idx])
+                data_off.append(offset)
+                data_addr.append(buffers[block_idx * block_layer + layer_idx])
+                data_len.append(block_layer_size)
+                offset += block_layer_size
+
+        # Load data from UC
+        task_id = ucmstore.LoadToHost(data_id, data_off, data_addr, data_len)
+        if task_id <= 0:
+            raise RuntimeError("ucmstore.LoadToHost failed: invalid task_id")
+
+        # Wait for completion
+        ret = ucmstore.Wait(task_id)
+        if ret != 0:
+            raise RuntimeError(
+                f"ucmstore.Wait failed for fetch task_id={task_id}, ret={ret}"
+            )
+
+        # Release buffers
+        ucmstore.ReleaseHostBuffers(buffers)
+
+    logs = cap.read()
+    print(filter_task_logs(logs))
+
+    # Extract average bandwidth
+    bw_list = [float(x) for x in re.findall(r"bw=([\d\.]+)GB/s", logs)]
+    avg_bw = sum(bw_list) / len(bw_list) if bw_list else None
+    return avg_bw
+
+
+# ========= Bandwidth Check =========
+def run_bandwidth_check():
+    """
+    Run UC embedding and fetching operations on KVCache blocks,
+    measure bandwidth for each batch, and calculate overall average.
+
+    Returns:
+        dict: Summary of average bandwidth for 'embed' and 'fetch' in GB/s.
+    """
+    # UC block and layer configuration
+    block_dim = 576
+    block_len = 128
+    block_elem_size = 2
+    block_layer = 61
+    block_layer_size = block_dim * block_len * block_elem_size
+    block_size = block_layer_size * block_layer
+    batch_size = 256
+
+    setup_uc(block_size)
+    hashes = [secrets.token_hex(16) for _ in range(KVCACHE_BLOCK_NUMBER)]
+    total_batches = (KVCACHE_BLOCK_NUMBER + batch_size - 1) // batch_size
+
+    bw_summary = {"embed": [], "fetch": []}
+
+    print("\n----------------------------------------")
+    print("[UC] Start embed batch and fetch batch. Processing KVCache blocks...")
+
+    # Embed batches
+    for batch in range(total_batches):
+        start = batch_size * batch
+        end = min(start + batch_size, KVCACHE_BLOCK_NUMBER)
+        avg_bw = embed(hashes[start:end], block_layer_size, block_layer)
+        if avg_bw:
+            bw_summary["embed"].append(avg_bw)
+
+    print("[UC] Start fetch batch. Processing KVCache blocks...")
+    # Fetch batches
+    for batch in range(total_batches):
+        start = batch_size * batch
+        end = min(start + batch_size, KVCACHE_BLOCK_NUMBER)
+        avg_bw = fetch(hashes[start:end], block_layer_size, block_layer)
+        if avg_bw:
+            bw_summary["fetch"].append(avg_bw)
+
+    # Calculate overall average bandwidth
+    for key in bw_summary:
+        if bw_summary[key]:
+            bw_summary[key] = sum(bw_summary[key]) / len(bw_summary[key])
+        else:
+            bw_summary[key] = None
+
+    return bw_summary
diff --git a/test/common/uc_eval/utils/metric.py b/test/common/uc_eval/utils/metric.py
index b6b0b8004..273604e80 100644
--- a/test/common/uc_eval/utils/metric.py
+++ b/test/common/uc_eval/utils/metric.py
@@ -72,7 +72,7 @@ def match(
         self,
         expected_output: Union[str, List[str], tuple[str]],
         real_output: str,
-        **kwargs
+        **kwargs,
     ):
         pass
 
diff --git a/test/config.yaml b/test/config.yaml
index f61793c31..3d2f809c0 100644
--- a/test/config.yaml
+++ b/test/config.yaml
@@ -32,4 +32,54 @@ llm_connection:
   tokenizer_path: "/home/models/QwQ-32B"
   stream: true    # stream output
   ignore_eos: true    # Ignore the returned terminator
-  timeout: 180    # request time out
\ No newline at end of file
+  timeout: 180    # request time out
+
+reports:
+  base_dir: "results/reports"
+  use_timestamp: true
+  directory_prefix: "pytest"
+  html: # pytest-html
+    enabled: true
+    filename: "report.html"
+    title: "UCM Pytest Test Report"
+
+database:
+  backup: "results/"
+  enabled: true
+  host: "127.0.0.1"
+  port: 3306
+  name: "ucm_pytest"
+  user: "root"
+  password: "123456"
+  charset: "utf8mb4"
+
+models:
+  ip_ports: ""
+  tokenizer_path: ""
+  served_model_name: ""
+  payload: ''
+  enable_clear_hbm: false
+
+
+# LLM Connection Configuration
+llm_connection:
+  model: "qwen3"
+  server_url: "http://141.111.32.70:9382"
+  tokenizer_path: "/home/models/QwQ-32B"
+  stream: true    # stream output
+  ignore_eos: true    # Ignore the returned terminator
+  timeout: 180    # request time out
+
+# Environment Pre-Check Configuration
+Env_preCheck:
+  master_ip: 141.111.32.70
+  worker_ip: 141.111.32.72
+  ascend_rt_visible_devices: "0,1"
+  node_num: 2
+  model_path: "/home/models/QwQ-32B"
+  hf_model_name: "QwQ-32B"
+  middle_page: "Qwen"
+  expected_embed_bandwidth: 10
+  expected_fetch_bandwidth: 10
+  kvCache_block_number: 1024
+  storage_backends: ["/home/menglong/data"]
\ No newline at end of file
diff --git a/test/pytest.ini b/test/pytest.ini
index 4be3cf477..16643b39f 100644
--- a/test/pytest.ini
+++ b/test/pytest.ini
@@ -18,8 +18,8 @@ norecursedirs = .git venv env __pycache__ *.egg
 
 markers =
     # -------- Levels (Required) --------
-    stage(n): Unit/Smoke/Regression/Release (0=Unit 1=Smoke 2=Regression 3=Release)
+    stage: Unit/Smoke/Regression/Release (0=Unit 1=Smoke 2=Regression 3=Release)
     # -------- Features (Recommended) --------
     feature:     Feature tag
-    platform(name): Platform tag(gpu/npu)
+    platform: Platform tag(gpu/npu)
 # end of markers
\ No newline at end of file
diff --git a/test/suites/E2E/test_environment_precheck.py b/test/suites/E2E/test_environment_precheck.py
new file mode 100644
index 000000000..355652894
--- /dev/null
+++ b/test/suites/E2E/test_environment_precheck.py
@@ -0,0 +1,266 @@
+from pathlib import Path
+
+import pytest
+import yaml
+from common.envPreCheck.run_env_preCheck import (
+    LOCAL_SSH_KEY,
+    MASTER_IP,
+    WORKER_IP,
+    run_bandwidth_check,
+    run_check_hccn_ping,
+    run_check_model_weight,
+    run_check_nvidia_ping,
+    run_hccn_device_status_check,
+    run_hccn_tls_check,
+    run_nvidia_device_status_check,
+    run_set_ssh_login,
+)
+
+
+# ========= Environment Setup =========
+@pytest.mark.stage(1)
+@pytest.mark.platform("npu")
+@pytest.mark.feature("test_ssh_login")
+def test_ssh_login():
+    """
+    Load environment variables from file and configure SSH login.
+    Dynamically generates value_lists based on ssh_result content.
+
+    Returns:
+        dict: SSH check result in value_lists format
+    """
+    ssh_result = run_set_ssh_login()
+
+    value_lists = {}
+
+    # Dynamically iterate through ssh_result to generate value_lists
+    for key, value in ssh_result.items():
+        # Structure like {"MASTER_IP": {"ip": "...", "status": True}}
+        if isinstance(value, dict) and "status" in value:
+            value_lists[f"SSH_CHECK_{key}"] = value["status"]
+
+        # Structure like {"SSH_CHECK": True}
+        elif isinstance(value, bool):
+            value_lists[key] = value
+
+        else:
+            continue
+
+    # Ensure SSH_CHECK itself must pass
+    assert ssh_result.get("SSH_CHECK", False) is True, f"SSH login failed: {ssh_result}"
+
+
+# ========= Device Status Check =========
+@pytest.mark.stage(1)
+@pytest.mark.platform("npu")
+@pytest.mark.feature("test_check_hccn_device_status")
+def test_hccn_check_device_status():
+    """
+    Check the status of all devices in the cluster.
+    Dynamically generates value_lists based on device_status content.
+
+    Returns:
+        dict: Device status check result in value_lists format
+    """
+    device_status = run_hccn_device_status_check()
+
+    value_lists = {}
+
+    # Dynamically iterate through device_status, add to value_lists when status is found
+    for key, value in device_status.items():
+        if isinstance(value, dict) and "status" in value:
+            value_lists[key] = [value["status"]]
+
+    # Overall validation
+    assert (
+        device_status.get("device_status_check", {}).get("status", False) is True
+    ), f"Device status check failed: {device_status}"
+
+
+@pytest.mark.stage(1)
+@pytest.mark.platform("gpu")
+@pytest.mark.feature("test_check_nvidia_device_status")
+def test_nvidia_check_device_status():
+    """
+    Check the status of all devices in the cluster.
+    Dynamically generates value_lists based on device_status content.
+
+    Returns:
+        dict: Device status check result in value_lists format
+    """
+    device_status = run_nvidia_device_status_check()
+
+    value_lists = {}
+
+    # Dynamically iterate through device_status, add to value_lists when status is found
+    for key, value in device_status.items():
+        if isinstance(value, dict) and "status" in value:
+            value_lists[key] = [value["status"]]
+
+    # Overall validation
+    assert (
+        device_status.get("device_status_check", {}).get("status", False) is True
+    ), f"Device status check failed: {device_status}"
+
+
+# ========= Ping Connectivity Check =========
+@pytest.mark.stage(1)
+@pytest.mark.platform("npu")
+@pytest.mark.feature("test_check_ascend_ping")
+def test_check_hccn_ping():
+    """
+    Perform ping connectivity check for the detected environment type (ASCEND).
+
+    Returns:
+        dict: Ping check result with dynamic value_lists
+    """
+    ping_result = run_check_hccn_ping()
+
+    # Dynamic value_lists container
+    value_lists = {}
+
+    # 1Add all keys except the summary key (hccn_ping_check)
+    for key, info in ping_result.items():
+        if key == "hccn_ping_check":
+            continue
+        value_lists[key] = [info.get("status", False)]
+
+    # Add final summary ping check key as the last entry
+    final_status = ping_result.get("hccn_ping_check", {}).get("status", False)
+    value_lists["hccn_ping_check"] = [final_status]
+
+    # Assertion: final summary must pass
+    assert final_status is True, f"ASCEND ping failed: {ping_result}"
+
+
+@pytest.mark.stage(1)
+@pytest.mark.platform("gpu")
+@pytest.mark.feature("test_check_nvidia_ping")
+def test_check_nvidia_ping():
+    """
+    Perform ping connectivity check for the detected environment type (NVIDIA).
+
+    Returns:
+        dict: Ping check result with dynamic value_lists
+    """
+    ping_result = run_check_nvidia_ping()
+
+    # Dynamic value_lists container
+    value_lists = {}
+
+    # 1Add all keys except the summary key (nvidia_ping_check)
+    for key, info in ping_result.items():
+        if key == "nvidia_ping_check":
+            continue
+        value_lists[key] = [info.get("status", False)]
+
+    # Add final summary ping check key as the last entry
+    final_status = ping_result.get("nvidia_ping_check", {}).get("status", False)
+    value_lists["nvidia_ping_check"] = [final_status]
+
+    # Assertion: final summary must pass
+    assert final_status is True, f"NVIDIA ping failed: {ping_result}"
+
+
+# ========= TLS Connectivity Check =========
+@pytest.mark.stage(1)
+@pytest.mark.platform("npu")
+@pytest.mark.feature("test_check_tls")
+def test_check_tls():
+    """
+    Check TLS switch status of all HCCN cards on master and worker nodes.
+    Dynamically build value_lists based on tls_result content.
+
+    Returns:
+        dict: TLS check result stored inside value_lists
+    """
+    tls_result = run_hccn_tls_check(MASTER_IP, WORKER_IP)
+
+    tls_data = tls_result.get("tls_check", {})
+    value_lists = {}
+
+    # Dynamically extract each field and its status
+    for key, entry in tls_data.items():
+        if key == "status":
+            continue
+        else:
+            # Each card's status
+            value_lists[key] = [entry.get("status", False)]
+
+    value_lists["tls_check"] = [tls_data.get("status", False)]
+
+    # Assert overall TLS status
+    assert tls_data.get("status", False) is True, f"TLS check failed: {tls_result}"
+
+
+# ========= Model Weight Files Check =========
+@pytest.mark.stage(1)
+@pytest.mark.platform("npu")
+@pytest.mark.feature("test_check_model_weights")
+def test_check_model_weights():
+    """
+    Verify the existence and correctness of model weight files.
+
+    Returns:
+        dict: Model weight check result with dynamic value_lists
+    """
+
+    model_weight = run_check_model_weight()
+
+    # Dynamic value_lists container
+    value_lists = {}
+
+    # Iterate through all top-level keys except "model_weight_check"
+    for key, info in model_weight.items():
+        if key == "model_weight_check":
+            continue
+        # Add status as list
+        value_lists[key] = [info.get("status", False)]
+
+    # Add model_weight_check as last field
+    final_status = model_weight.get("model_weight_check", {}).get("status", False)
+    value_lists["model_weight_check"] = [final_status]
+
+    # Final assertion
+    assert final_status is True, f"Model weight check failed: {model_weight}"
+
+
+# ========= Bandwidth Check =========
+@pytest.mark.stage(1)
+@pytest.mark.platform("npu")
+@pytest.mark.feature("test_check_bandwidth")
+def test_check_bandwidth():
+    """
+    Measure storage system bandwidth for embedding and fetching operations.
+    Dynamically generate value_lists from the returned bandwidth dict.
+
+    Returns:
+        dict: Bandwidth summary stored in value_lists format
+    """
+    bandwidth = run_bandwidth_check()
+    print("bandwidth", bandwidth)
+
+    value_lists = {}
+
+    # Dynamically generate key, e.g., embed → embed_avg_bandwidth
+    for key, val in bandwidth.items():
+        dynamic_key = f"{key}_avg_bandwidth"
+        value_lists[dynamic_key] = [val]
+
+    config_file = Path(__file__).parent.parent.parent / "config.yaml"
+    with open(config_file, "r", encoding="utf-8") as f:
+        config = yaml.safe_load(f)
+        EXPECTED_EMBED_BANDWIDTH = config.get("Env_preCheck", {}).get(
+            "expected_embed_bandwidth", ""
+        )
+        EXPECTED_FETCH_BANDWIDTH = config.get("Env_preCheck", {}).get(
+            "expected_fetch_bandwidth", ""
+        )
+
+    # Validation
+    assert (
+        bandwidth["embed"] < 0.85 * EXPECTED_EMBED_BANDWIDTH
+    ), f"Embed bandwidth too high: {bandwidth['embed']} GB/s"
+    assert (
+        bandwidth["fetch"] < 0.85 * EXPECTED_FETCH_BANDWIDTH
+    ), f"Fetch bandwidth too high: {bandwidth['fetch']} GB/s"