515.86.01

2026-01-30 04:59:46 +00:00 · 2022-11-22 10:04:21 -08:00
parent fe0728787f
commit c700e8f91c
34 changed files with 368 additions and 108 deletions
--- a/kernel-open/Kbuild
+++ b/kernel-open/Kbuild
@@ -72,7 +72,7 @@ EXTRA_CFLAGS += -I$(src)/common/inc
 EXTRA_CFLAGS += -I$(src)
 EXTRA_CFLAGS += -Wall -MD $(DEFINES) $(INCLUDES) -Wno-cast-qual -Wno-error -Wno-format-extra-args
 EXTRA_CFLAGS += -D__KERNEL__ -DMODULE -DNVRM
-EXTRA_CFLAGS += -DNV_VERSION_STRING=\"515.76\"
+EXTRA_CFLAGS += -DNV_VERSION_STRING=\"515.86.01\"

 EXTRA_CFLAGS += -Wno-unused-function

--- a/kernel-open/common/inc/nv.h
+++ b/kernel-open/common/inc/nv.h
@@ -628,7 +628,7 @@ static inline NvBool IS_REG_OFFSET(nv_state_t *nv, NvU64 offset, NvU64 length)
 {
    return ((offset >= nv->regs->cpu_address) &&

-
+            ((offset + (length - 1)) >= offset) &&

            ((offset + (length - 1)) <= (nv->regs->cpu_address + (nv->regs->size - 1))));
 }
@@ -637,7 +637,7 @@ static inline NvBool IS_FB_OFFSET(nv_state_t *nv, NvU64 offset, NvU64 length)
 {
    return  ((nv->fb) && (offset >= nv->fb->cpu_address) &&

-
+             ((offset + (length - 1)) >= offset) &&

             ((offset + (length - 1)) <= (nv->fb->cpu_address + (nv->fb->size - 1))));
 }
@@ -647,7 +647,7 @@ static inline NvBool IS_UD_OFFSET(nv_state_t *nv, NvU64 offset, NvU64 length)
    return ((nv->ud.cpu_address != 0) && (nv->ud.size != 0) &&
            (offset >= nv->ud.cpu_address) &&

-
+            ((offset + (length - 1)) >= offset) &&

            ((offset + (length - 1)) <= (nv->ud.cpu_address + (nv->ud.size - 1))));
 }
@@ -658,7 +658,7 @@ static inline NvBool IS_IMEM_OFFSET(nv_state_t *nv, NvU64 offset, NvU64 length)
            (nv->bars[NV_GPU_BAR_INDEX_IMEM].size != 0) &&
            (offset >= nv->bars[NV_GPU_BAR_INDEX_IMEM].cpu_address) &&

-
+            ((offset + (length - 1)) >= offset) &&

            ((offset + (length - 1)) <= (nv->bars[NV_GPU_BAR_INDEX_IMEM].cpu_address +
                                         (nv->bars[NV_GPU_BAR_INDEX_IMEM].size - 1))));
--- a/kernel-open/conftest.sh
+++ b/kernel-open/conftest.sh
@@ -5268,7 +5268,7 @@ compile_test() {
            # Determine if 'num_registered_fb' variable is present.
            #
            # 'num_registered_fb' was removed by commit 5727dcfd8486
-            # ("fbdev: Make registered_fb[] private to fbmem.c) for
+            # ("fbdev: Make registered_fb[] private to fbmem.c") for
            # v5.20 linux-next (2022-07-27).
            #
            CODE="
@@ -5280,6 +5280,31 @@ compile_test() {
            compile_check_conftest "$CODE" "NV_NUM_REGISTERED_FB_PRESENT" "" "types"
        ;;

+        acpi_video_backlight_use_native)
+            #
+            # Determine if acpi_video_backlight_use_native() function is present
+            #
+            # acpi_video_backlight_use_native was added by commit 2600bfa3df99
+            # ("ACPI: video: Add acpi_video_backlight_use_native() helper") for
+            # v6.0 (2022-08-17). Note: the include directive for <linux/types.h>
+            # in this conftest is necessary in order to support kernels between
+            # commit 0b9f7d93ca61 ("ACPI / i915: ignore firmware requests for
+            # backlight change") for v3.16 (2014-07-07) and commit 3bd6bce369f5
+            # ("ACPI / video: Port to new backlight interface selection API")
+            # for v4.2 (2015-07-16). Kernels within this range use the 'bool'
+            # type and the related 'false' value in <acpi/video.h> without first
+            # including the definitions of that type and value.
+            #
+            CODE="
+            #include <linux/types.h>
+            #include <acpi/video.h>
+            void conftest_acpi_video_backglight_use_native(void) {
+                acpi_video_backlight_use_native(0);
+            }"
+
+            compile_check_conftest "$CODE" "NV_ACPI_VIDEO_BACKLIGHT_USE_NATIVE" "" "functions"
+        ;;
+
        # When adding a new conftest entry, please use the correct format for
        # specifying the relevant upstream Linux kernel commit.
        #
--- a/kernel-open/nvidia-drm/nvidia-drm-gem-nvkms-memory.c
+++ b/kernel-open/nvidia-drm/nvidia-drm-gem-nvkms-memory.c
@@ -95,7 +95,11 @@ static vm_fault_t __nv_drm_gem_nvkms_handle_vma_fault(
        pfn >>= PAGE_SHIFT;
        pfn += page_offset;
    } else {
-        BUG_ON(page_offset > nv_nvkms_memory->pages_count);
+
+        BUG_ON(page_offset >= nv_nvkms_memory->pages_count);
+
+
+
        pfn = page_to_pfn(nv_nvkms_memory->pages[page_offset]);
    }

--- a/kernel-open/nvidia-drm/nvidia-drm-gem-user-memory.c
+++ b/kernel-open/nvidia-drm/nvidia-drm-gem-user-memory.c
@@ -112,7 +112,11 @@ static vm_fault_t __nv_drm_gem_user_memory_handle_vma_fault(

    page_offset = vmf->pgoff - drm_vma_node_start(&gem->vma_node);

-    BUG_ON(page_offset > nv_user_memory->pages_count);
+
+    BUG_ON(page_offset >= nv_user_memory->pages_count);
+
+
+

    ret = vm_insert_page(vma, address, nv_user_memory->pages[page_offset]);
    switch (ret) {
--- a/kernel-open/nvidia-drm/nvidia-drm-linux.c
+++ b/kernel-open/nvidia-drm/nvidia-drm-linux.c
@@ -47,6 +47,16 @@ module_param_named(modeset, nv_drm_modeset_module_param, bool, 0400);

 void *nv_drm_calloc(size_t nmemb, size_t size)
 {
+
+    size_t total_size = nmemb * size;
+    //
+    // Check for overflow.
+    //
+    if ((nmemb != 0) && ((total_size / nmemb) != size))
+    {
+        return NULL;
+    }
+
    return kzalloc(nmemb * size, GFP_KERNEL);
 }

--- a/kernel-open/nvidia-modeset/nvidia-modeset-linux.c
+++ b/kernel-open/nvidia-modeset/nvidia-modeset-linux.c
@@ -35,6 +35,8 @@
 #include <linux/list.h>
 #include <linux/rwsem.h>

+#include <acpi/video.h>
+
 #include "nvstatus.h"

 #include "nv-register-module.h"
@@ -1060,6 +1062,12 @@ nvkms_register_backlight(NvU32 gpu_id, NvU32 display_id, void *drv_priv,
    struct nvkms_backlight_device *nvkms_bd = NULL;
    int i;

+#if defined(NV_ACPI_VIDEO_BACKLIGHT_USE_NATIVE)
+    if (!acpi_video_backlight_use_native()) {
+        return NULL;
+    }
+#endif
+
    gpu_info = nvkms_alloc(NV_MAX_GPUS * sizeof(*gpu_info), NV_TRUE);
    if (gpu_info == NULL) {
        return NULL;
--- a/kernel-open/nvidia-modeset/nvidia-modeset.Kbuild
+++ b/kernel-open/nvidia-modeset/nvidia-modeset.Kbuild
@@ -96,4 +96,5 @@ NV_CONFTEST_FUNCTION_COMPILE_TESTS += kthread_create_on_node
 NV_CONFTEST_FUNCTION_COMPILE_TESTS += list_is_first
 NV_CONFTEST_FUNCTION_COMPILE_TESTS += ktime_get_real_ts64
 NV_CONFTEST_FUNCTION_COMPILE_TESTS += ktime_get_raw_ts64
+NV_CONFTEST_FUNCTION_COMPILE_TESTS += acpi_video_backlight_use_native
 NV_CONFTEST_SYMBOL_COMPILE_TESTS += is_export_symbol_present_kthread_create_on_node
--- a/kernel-open/nvidia/nv-dmabuf.c
+++ b/kernel-open/nvidia/nv-dmabuf.c
@@ -26,6 +26,15 @@


 #if defined(CONFIG_DMA_SHARED_BUFFER)
+
+//
+// The Linux kernel's dma_length in struct scatterlist is unsigned int
+// which limits the maximum sg length to 4GB - 1.
+// To get around this limitation, the BAR1 scatterlist returned by RM
+// is split into (4GB - PAGE_SIZE) sized chunks to build the sg_table.
+//
+#define NV_DMA_BUF_SG_MAX_LEN         ((NvU32)(NVBIT64(32) - PAGE_SIZE))
+
 typedef struct nv_dma_buf_mem_handle
 {
    NvHandle h_memory;
@@ -259,26 +268,36 @@ nv_dma_buf_unmap_unlocked(
    nv_dma_device_t *peer_dma_dev,
    nv_dma_buf_file_private_t *priv,
    struct sg_table *sgt,
-    NvU32 count
+    NvU32 mapped_handle_count
 )
 {
    NV_STATUS status;
    NvU32 i;
    NvU64 dma_len;
    NvU64 dma_addr;
-    NvU64 bar1_va;
    NvBool bar1_unmap_needed;
    struct scatterlist *sg = NULL;

    bar1_unmap_needed = (priv->bar1_va_ref_count == 0);

-    for_each_sg(sgt->sgl, sg, count, i)
+    sg = sgt->sgl;
+    for (i = 0; i < mapped_handle_count; i++)
    {
-        dma_addr = sg_dma_address(sg);
-        dma_len  = priv->handles[i].size;
-        bar1_va  = priv->handles[i].bar1_va;
+        NvU64 handle_size = priv->handles[i].size;

-        WARN_ON(sg_dma_len(sg) != priv->handles[i].size);
+        dma_addr = sg_dma_address(sg);
+        dma_len  = 0;
+
+        //
+        // Seek ahead in the scatterlist until the handle size is covered.
+        // IOVA unmap can then be done all at once instead of doing it
+        // one sg at a time.
+        //
+        while(handle_size != dma_len)
+        {
+            dma_len += sg_dma_len(sg);
+            sg = sg_next(sg);
+        }

        nv_dma_unmap_peer(peer_dma_dev, (dma_len / os_page_size), dma_addr);

@@ -309,7 +328,8 @@ nv_dma_buf_map(
    nv_dma_device_t peer_dma_dev = {{ 0 }};
    NvBool bar1_map_needed;
    NvBool bar1_unmap_needed;
-    NvU32 count = 0;
+    NvU32 mapped_handle_count = 0;
+    NvU32 num_sg_entries = 0;
    NvU32 i = 0;
    int rc = 0;

@@ -361,13 +381,23 @@ nv_dma_buf_map(
    }

    memset(sgt, 0, sizeof(struct sg_table));
+    //
+    // Pre-calculate number of sg entries we need based on handle size.
+    // This is needed to allocate sg_table.
+    //
+    for (i = 0; i < priv->num_objects; i++)
+    {
+        NvU64 count = priv->handles[i].size + NV_DMA_BUF_SG_MAX_LEN - 1;
+        do_div(count, NV_DMA_BUF_SG_MAX_LEN);
+        num_sg_entries += count;
+    }

    //
    // RM currently returns contiguous BAR1, so we create as many
-    // sg entries as the number of handles being mapped.
+    // sg entries as num_sg_entries calculated above.
    // When RM can alloc discontiguous BAR1, this code will need to be revisited.
    //
-    rc = sg_alloc_table(sgt, priv->num_objects, GFP_KERNEL);
+    rc = sg_alloc_table(sgt, num_sg_entries, GFP_KERNEL);
    if (rc != 0)
    {
        goto free_sgt;
@@ -377,7 +407,8 @@ nv_dma_buf_map(
    peer_dma_dev.addressable_range.limit = (NvU64)dev->dma_mask;
    bar1_map_needed = bar1_unmap_needed = (priv->bar1_va_ref_count == 0);

-    for_each_sg(sgt->sgl, sg, priv->num_objects, i)
+    sg = sgt->sgl;
+    for (i = 0; i < priv->num_objects; i++)
    {
        NvU64 dma_addr;
        NvU64 dma_len;
@@ -395,9 +426,15 @@ nv_dma_buf_map(
            }
        }

+        mapped_handle_count++;
+
        dma_addr = priv->handles[i].bar1_va;
        dma_len  = priv->handles[i].size;

+        //
+        // IOVA map the full handle at once and then break down the range
+        // (dma_addr, dma_addr + dma_len) into smaller sg entries.
+        //
        status = nv_dma_map_peer(&peer_dma_dev, priv->nv->dma_dev,
                                 0x1, (dma_len / os_page_size), &dma_addr);
        if (status != NV_OK)
@@ -411,14 +448,23 @@ nv_dma_buf_map(
                                                   priv->handles[i].bar1_va);
            }

+            mapped_handle_count--;
+
            // Unmap remaining memory handles
            goto unmap_handles;
        }

-        sg_set_page(sg, NULL, dma_len, 0);
-        sg_dma_address(sg) = (dma_addr_t)dma_addr;
-        sg_dma_len(sg) = dma_len;
-        count++;
+        while(dma_len != 0)
+        {
+            NvU32 sg_len = NV_MIN(dma_len, NV_DMA_BUF_SG_MAX_LEN);
+
+            sg_set_page(sg, NULL, sg_len, 0);
+            sg_dma_address(sg) = (dma_addr_t)dma_addr;
+            sg_dma_len(sg) = sg_len;
+            dma_addr += sg_len;
+            dma_len -= sg_len;
+            sg = sg_next(sg);
+        }
    }

    priv->bar1_va_ref_count++;
@@ -434,7 +480,7 @@ nv_dma_buf_map(
    return sgt;

 unmap_handles:
-    nv_dma_buf_unmap_unlocked(sp, &peer_dma_dev, priv, sgt, count);
+    nv_dma_buf_unmap_unlocked(sp, &peer_dma_dev, priv, sgt, mapped_handle_count);

    sg_free_table(sgt);

@@ -821,12 +867,12 @@ nv_dma_buf_reuse(
    }


+    if ((priv->total_objects < params->numObjects) ||
+        (params->index > (priv->total_objects - params->numObjects)))



-    if (params->index > (priv->total_objects - params->numObjects))
    {
-
        status = NV_ERR_INVALID_ARGUMENT;
        goto unlock_priv;
    }
--- a/kernel-open/nvidia/nv-mmap.c
+++ b/kernel-open/nvidia/nv-mmap.c
@@ -133,10 +133,10 @@ nvidia_vma_access(
    pageOffset = (addr & ~PAGE_MASK);


-
-
-
-
+    if (length < 0)
+    {
+        return -EINVAL;
+    }


    if (!mmap_context->valid)
@@ -217,8 +217,19 @@ static vm_fault_t nvidia_fault(

    NvU64 page;
    NvU64 num_pages = NV_VMA_SIZE(vma) >> PAGE_SHIFT;
-    NvU64 pfn_start =
-        (nvlfp->mmap_context.mmap_start >> PAGE_SHIFT) + vma->vm_pgoff;
+
+    NvU64 pfn_start = (nvlfp->mmap_context.mmap_start >> PAGE_SHIFT);
+
+
+
+
+
+
+    if (vma->vm_pgoff != 0)
+    {
+        return VM_FAULT_SIGBUS;
+    }
+

    // Mapping revocation is only supported for GPU mappings.
    if (NV_IS_CTL_DEVICE(nv))
@@ -490,6 +501,13 @@ int nvidia_mmap_helper(
        return -EINVAL;
    }

+
+    if (vma->vm_pgoff != 0)
+    {
+        return -EINVAL;
+    }
+
+
    NV_PRINT_VMA(NV_DBG_MEMINFO, vma);

    status = nv_check_gpu_state(nv);
@@ -517,11 +535,11 @@ int nvidia_mmap_helper(
        NvU64 access_len = mmap_context->access_size;


-
-
-
-
-
+        // validate the size
+        if (NV_VMA_SIZE(vma) != mmap_length)
+        {
+            return -ENXIO;
+        }

        if (IS_REG_OFFSET(nv, access_start, access_len))
        {
--- a/kernel-open/nvidia/nv.c
+++ b/kernel-open/nvidia/nv.c
@@ -1468,8 +1468,8 @@ static int nv_open_device(nv_state_t *nv, nvidia_stack_t *sp)
    }


-
-
+    if (unlikely(NV_ATOMIC_READ(nvl->usage_count) >= NV_S32_MAX))
+        return -EMFILE;


    if ( ! (nv->flags & NV_FLAG_OPEN))
--- a/kernel-open/nvidia/nvlink_linux.c
+++ b/kernel-open/nvidia/nvlink_linux.c
@@ -208,8 +208,8 @@ static int nvlink_fops_release(struct inode *inode, struct file *filp)
    nvlink_print(NVLINK_DBG_INFO, "nvlink driver close\n");


-
-
+    if (private == NULL)
+        return -ENOMEM;


    mutex_lock(&nvlink_drvctx.lock);