GPU Detection¶

`gpu` ¶

GPU detection, VRAM information, and CUDA version detection.

Replaces Test-NvidiaGpu and Get-GpuVramInfo from UmeAiRTUtils.psm1. Uses subprocess to call nvidia-smi (works on both Windows and Linux).

`GpuInfo(name, vram_gib, cuda_version=None)` `dataclass` ¶

Information about a detected NVIDIA GPU.

`detect_cuda_version()` ¶

Detect CUDA version from the NVIDIA driver.

Queries the driver version via nvidia-smi and maps it to the maximum supported CUDA toolkit version.

Returns:

Type	Description
`tuple[int, int] \| None`	`(major, minor)` tuple (e.g. `(13, 0)`), or `None` if the driver version cannot be queried or parsed, or no mapping entry matches.

Source code in src/utils/gpu.py

def detect_cuda_version() -> tuple[int, int] | None:
    """Report the CUDA version that corresponds to the installed NVIDIA driver.

    Asks ``nvidia-smi`` for the driver version, takes the part before the
    first dot of the first output line, and returns the CUDA version of the
    first ``_DRIVER_CUDA_MAP`` entry whose minimum driver does not exceed it.

    Returns:
        ``(major, minor)`` tuple (e.g. ``(13, 0)``), or ``None`` when the
        command fails, prints nothing, cannot be parsed, or no entry matches.
    """
    query = ["nvidia-smi", "--query-gpu=driver_version", "--format=csv,noheader,nounits"]
    try:
        proc = subprocess.run(query, capture_output=True, text=True, timeout=10)
        if proc.returncode != 0:
            return None
        output = proc.stdout.strip()
        if not output:
            return None

        # Only the first output line is consulted.
        first_line = output.split("\n")[0].strip()
        major_text = first_line.split(".")[0]
        driver_major = float(major_text)

        # First matching entry wins, so the map's order decides the result.
        return next(
            (cuda for minimum, cuda in _DRIVER_CUDA_MAP if driver_major >= minimum),
            None,
        )
    except (FileNotFoundError, subprocess.TimeoutExpired, ValueError, OSError):
        # Missing binary, hang, or unparsable version all mean "unknown".
        return None

`detect_nvidia_gpu(log=None)` ¶

Check for the presence of an NVIDIA GPU.

Returns:

Type	Description
`bool`	True if an NVIDIA GPU is detected, False otherwise.

Source code in src/utils/gpu.py

def detect_nvidia_gpu(log: InstallerLogger | None = None) -> bool:
    """
    Probe for an NVIDIA GPU by listing devices with ``nvidia-smi -L``.

    Args:
        log: Logger used for progress messages; ``get_logger()`` is used
            when omitted.

    Returns:
        True if an NVIDIA GPU is detected, False otherwise.
    """
    log = get_logger() if log is None else log
    log.item("Checking for NVIDIA GPU...")

    try:
        listing = subprocess.run(
            ["nvidia-smi", "-L"], capture_output=True, text=True, timeout=10
        )
        found = listing.returncode == 0 and "GPU 0:" in listing.stdout
        if not found:
            log.warning("No NVIDIA GPU detected. Skipping GPU-only packages.", level=1)
            return False

        log.sub("NVIDIA GPU detected.", style="success")
        # Echo the first line of the device listing.
        log.info(listing.stdout.strip().split("\n")[0])
        return True
    except (FileNotFoundError, subprocess.TimeoutExpired, OSError):
        # The tool is missing or did not answer in time: treat as "no GPU".
        log.warning("'nvidia-smi' command failed. Assuming no GPU.", level=1)
        return False

`check_amd_gpu(log=None)` ¶

Check for the presence of an AMD GPU using OS-native commands.

Returns:

Type	Description
`bool`	True if an AMD GPU is detected, False otherwise.

Source code in src/utils/gpu.py

def _lspci_lists_amd_gpu(lspci_output: str) -> bool:
    """Return True if ``lspci`` output has an AMD device in a display class."""
    display_classes = ("VGA compatible controller", "3D controller", "Display controller")
    vendor_markers = ("Advanced Micro Devices", "AMD")
    return any(
        any(cls in line for cls in display_classes)
        and any(marker in line for marker in vendor_markers)
        for line in lspci_output.splitlines()
    )


def check_amd_gpu(log: InstallerLogger | None = None) -> bool:
    """
    Check for the presence of an AMD GPU using OS-native commands.

    On Windows the video controller names are read through PowerShell
    (``Win32_VideoController``) and searched for "AMD" or "RADEON"
    (case-insensitive). On Linux the ``lspci`` listing is searched, but only
    lines describing display-class devices are considered, so AMD CPUs and
    chipset devices are not mistaken for a GPU. Other platforms always
    yield False.

    Args:
        log: Logger used for progress messages; ``get_logger()`` is used
            when omitted.

    Returns:
        True if an AMD GPU is detected, False otherwise (including when the
        probing command is missing, fails, or times out).
    """
    import platform

    if log is None:
        log = get_logger()
    log.item("Checking for AMD GPU...")

    # Best-effort probe: a missing tool, non-zero exit, timeout, or
    # undecodable output all mean "could not confirm an AMD GPU".
    probe_errors = (subprocess.SubprocessError, OSError, ValueError)
    system = platform.system()

    if system == "Windows":
        try:
            result = subprocess.run(
                ["powershell", "-NoProfile", "-Command", "(Get-CimInstance Win32_VideoController).Name"],
                capture_output=True, text=True, check=True, timeout=10
            )
        except probe_errors:
            return False

        for raw_line in result.stdout.splitlines():
            name = raw_line.strip()
            upper_name = name.upper()
            if "AMD" in upper_name or "RADEON" in upper_name:
                log.sub(f"AMD GPU detected: {name}", style="success")
                return True
        return False

    if system == "Linux":
        try:
            result = subprocess.run(
                ["lspci"],
                capture_output=True, text=True, check=True, timeout=10
            )
        except probe_errors:
            return False

        is_amd = _lspci_lists_amd_gpu(result.stdout)
        if is_amd:
            log.sub("AMD GPU detected.", style="success")
        return is_amd

    return False

`get_gpu_vram_info()` ¶

Query NVIDIA GPU name and total VRAM.

Returns:

Type	Description
`GpuInfo \| None`	GpuInfo object with name, VRAM in GiB, and CUDA version, or None.

Source code in src/utils/gpu.py

def get_gpu_vram_info() -> GpuInfo | None:
    """
    Query NVIDIA GPU name and total VRAM.

    Runs ``nvidia-smi`` for the ``name`` and ``memory.total`` fields and
    parses the first row of its CSV output. When several GPUs are reported,
    only the first row is used. The CUDA version is filled in via
    ``detect_cuda_version()``.

    Returns:
        GpuInfo object with name, VRAM in GiB, and CUDA version, or None
        when ``nvidia-smi`` is unavailable, fails, times out, or prints
        output that cannot be parsed.
    """
    try:
        result = subprocess.run(  # returncode checked below
            ["nvidia-smi", "--query-gpu=name,memory.total", "--format=csv,noheader,nounits"],
            capture_output=True,
            text=True,
            timeout=10,
        )
        if result.returncode != 0 or not result.stdout.strip():
            return None

        # One CSV row is printed per GPU. Parse only the first row; splitting
        # the whole output on "," would merge rows and break int() below.
        first_row = result.stdout.strip().splitlines()[0]

        # Memory is the last field, so split from the right: a comma inside
        # the GPU name then cannot shift the memory column.
        name_field, separator, memory_field = first_row.rpartition(",")
        if not separator:
            return None

        name = name_field.strip()
        memory_mib = int(memory_field.strip())
        memory_gib = round(memory_mib / 1024)
        cuda = detect_cuda_version()

        return GpuInfo(name=name, vram_gib=memory_gib, cuda_version=cuda)

    except (FileNotFoundError, subprocess.TimeoutExpired, ValueError, OSError):
        # ValueError covers a non-numeric memory field.
        return None

`recommend_model_quality(vram_gib)` ¶

Recommend a model quality tier based on available VRAM.

Parameters:

Name	Type	Description	Default
`vram_gib`	`int`	Available VRAM in GiB.	required

Returns:

Type	Description
`str`	A recommendation string (e.g. "fp16", "GGUF Q4").

Source code in src/utils/gpu.py

def recommend_model_quality(vram_gib: int) -> str:
    """
    Pick the model quality tier that suits the given amount of VRAM.

    Args:
        vram_gib: Available VRAM in GiB.

    Returns:
        A recommendation string (e.g. "fp16", "GGUF Q4").
    """
    # (minimum VRAM in GiB, recommendation), highest tier first so the
    # first satisfied threshold is the best tier the card can hold.
    tiers = (
        (30, "fp16"),
        (18, "fp8 or GGUF Q8"),
        (16, "GGUF Q6"),
        (14, "GGUF Q5"),
        (12, "GGUF Q4"),
        (8, "GGUF Q3"),
    )
    for minimum, recommendation in tiers:
        if vram_gib >= minimum:
            return recommendation
    # Below every threshold: fall back to the smallest quantization.
    return "GGUF Q2"

`cuda_tag_from_version(cuda)` ¶

Map a CUDA version tuple to a supported cuda tag.

Parameters:

Name	Type	Description	Default
`cuda`	`tuple[int, int] \| None`	`(major, minor)` tuple, e.g. `(13, 0)`.	required

Returns:

Type	Description
`str \| None`	A tag like `"cu130"` or `"cu128"`, or `None` if unsupported.

Source code in src/utils/gpu.py

def cuda_tag_from_version(cuda: tuple[int, int] | None) -> str | None:
    """Map a CUDA version tuple to a supported cuda tag.

    Args:
        cuda: ``(major, minor)`` tuple, e.g. ``(13, 0)``.

    Returns:
        A tag like ``"cu130"`` or ``"cu128"``, or ``None`` if unsupported.
    """
    if cuda is None:
        return None
    major, minor = cuda
    if major >= 13:
        return "cu130"
    if major == 12 and minor >= 8:
        return "cu128"
    # Older CUDA — not supported
    return None

`display_gpu_recommendations(log=None)` ¶

Detect GPU and display VRAM-based model recommendations.

Returns:

Type	Description
`GpuInfo \| None`	The detected GpuInfo or None.

Source code in src/utils/gpu.py

def display_gpu_recommendations(log: InstallerLogger | None = None) -> GpuInfo | None:
    """
    Detect GPU and display VRAM-based model recommendations.

    Queries the NVIDIA GPU via ``get_gpu_vram_info()``. When one is found,
    its name, VRAM, CUDA version (if known) and the tier suggested by
    ``recommend_model_quality()`` are logged. Otherwise an AMD GPU is looked
    for with ``check_amd_gpu()`` and a generic hint is logged.

    Args:
        log: Logger used for all output, including the nested AMD probe;
            ``get_logger()`` is used when omitted.

    Returns:
        The detected GpuInfo or None.
    """
    if log is None:
        log = get_logger()

    log.log("─" * 70, level=-2)
    log.item("Checking for NVIDIA GPU to provide model recommendations...", style="warning")

    gpu = get_gpu_vram_info()
    if gpu:
        log.item(f"GPU: {gpu.name}", style="success")
        log.item(f"VRAM: {gpu.vram_gib} GB", style="success")
        if gpu.cuda_version:
            log.item(f"CUDA: {gpu.cuda_version[0]}.{gpu.cuda_version[1]}", style="success")
        rec = recommend_model_quality(gpu.vram_gib)
        log.item(f"Recommendation: {rec}", style="cyan")
    else:
        # Pass the logger through so the AMD probe reports to the same
        # logger as this function instead of the default one.
        if check_amd_gpu(log=log):
            log.item("AMD GPU detected.", style="success")
            log.item("Recommendation: GGUF models are generally recommended for AMD "
                     "without custom optimization.", style="cyan")
        else:
            log.item("No NVIDIA or AMD GPU detected. Please choose based on your hardware.", style="info")

    log.log("─" * 70, level=-2)
    return gpu

GPU Detection¶

gpu ¶

GpuInfo(name, vram_gib, cuda_version=None) dataclass ¶

detect_cuda_version() ¶

detect_nvidia_gpu(log=None) ¶

check_amd_gpu(log=None) ¶

get_gpu_vram_info() ¶

recommend_model_quality(vram_gib) ¶

cuda_tag_from_version(cuda) ¶

display_gpu_recommendations(log=None) ¶

`gpu` ¶

`GpuInfo(name, vram_gib, cuda_version=None)` `dataclass` ¶

`detect_cuda_version()` ¶

`detect_nvidia_gpu(log=None)` ¶

`check_amd_gpu(log=None)` ¶

`get_gpu_vram_info()` ¶

`recommend_model_quality(vram_gib)` ¶

`cuda_tag_from_version(cuda)` ¶

`display_gpu_recommendations(log=None)` ¶