580.65.06

Maneet Singh
2025-08-04 11:15:02 -07:00
parent d890313300
commit 307159f262
1315 changed files with 477791 additions and 279973 deletions


@@ -1,5 +1,5 @@
/*******************************************************************************
Copyright (c) 2015-2024 NVIDIA Corporation
Copyright (c) 2015-2025 NVIDIA Corporation
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to
@@ -205,12 +205,12 @@ typedef struct
//
// The indices represent the corresponding big PTEs in the block's interior.
// For example, a block with alignment and size of one 4k page on either
// side of a big page will only use bit 0. Use uvm_va_block_big_page_index to look
// the big_ptes index of a page.
// side of a big page will only use bit 0. Use uvm_va_block_big_page_index
// to look up the big_ptes index of a page.
//
// The block might not be able to fit any big PTEs, in which case this
// bitmap is always zero. Use uvm_va_block_gpu_num_big_pages to find the number of
// valid bits in this mask.
// bitmap is always zero. Use uvm_va_block_gpu_num_big_pages to find the
// number of valid bits in this mask.
DECLARE_BITMAP(big_ptes, MAX_BIG_PAGES_PER_UVM_VA_BLOCK);
// See the comments for uvm_va_block_mmap_t::cpu.pte_bits.
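An illustrative aside (not part of this change): a minimal sketch of how the big_ptes bitmap might be consulted. The wrapper, the uvm_va_block_gpu_state_t parameter type, and the exact helper signatures are assumptions based on the surrounding declarations in this header.

static bool example_page_has_big_pte(uvm_va_block_t *va_block,
                                     uvm_va_block_gpu_state_t *gpu_state,
                                     uvm_gpu_t *gpu,
                                     uvm_page_index_t page_index)
{
    NvU64 big_page_size = uvm_va_block_gpu_big_page_size(va_block, gpu);
    size_t big_index = uvm_va_block_big_page_index(va_block, page_index, big_page_size);

    // Pages outside the block's big-page-aligned interior have no big PTE slot.
    if (big_index == MAX_BIG_PAGES_PER_UVM_VA_BLOCK)
        return false;

    return test_bit(big_index, gpu_state->big_ptes);
}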
@@ -317,6 +317,17 @@ struct uvm_va_block_struct
// to pages resident on other processors.
uvm_processor_mask_t resident;
// Page mask tracking the set of block pages which have been discarded.
//
// Pages in this mask must be cleared if they are either migrated or
// evicted.
uvm_page_mask_t discarded_pages;
// The set of processors on which the VA block has ever been fully
// resident. This is used when determining whether GPU chunks need to be
// zeroed.
uvm_processor_mask_t ever_fully_resident;
// Per-processor mapping bit vector, used for fast lookup of which
// processors are active in this block.
//
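An illustrative sketch (not part of this change) of the clearing rule stated for the discarded_pages mask added above; the wrapper and its migrated_pages parameter are hypothetical.

static void example_clear_discarded_after_migration(uvm_va_block_t *va_block,
                                                    const uvm_page_mask_t *migrated_pages)
{
    // Pages that were just migrated (or evicted) are no longer discarded, so
    // drop them from the mask as the comment above requires.
    uvm_page_mask_andnot(&va_block->discarded_pages,
                         &va_block->discarded_pages,
                         migrated_pages);
}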
@@ -468,6 +479,12 @@ struct uvm_va_block_struct
// added to this tracker before the block's lock is dropped.
uvm_tracker_t tracker;
// Track whether any new DMA mappings have been created under this block for
// each parent GPU without having been invalidated yet according to the
// rules described in uvm_dma_map_invalidation_t. The invalidation must
// happen before the DMA mappings are accessed by the GPU.
uvm_parent_processor_mask_t needs_phys_invalidate;
// A queue item for establishing eviction mappings in a deferred way
nv_kthread_q_item_t eviction_mappings_q_item;
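An illustrative sketch (not part of this change) of how the needs_phys_invalidate mask above might be set when a new DMA mapping is created; the wrapper, the uvm_parent_processor_mask_set() call, and the parent_gpu->id usage are assumptions here.

static void example_note_new_dma_mapping(uvm_va_block_t *va_block,
                                         uvm_parent_gpu_t *parent_gpu)
{
    // Record that this parent GPU has a fresh DMA mapping under the block;
    // the corresponding invalidate must happen before the GPU accesses it.
    uvm_parent_processor_mask_set(&va_block->needs_phys_invalidate, parent_gpu->id);
}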
@@ -565,8 +582,8 @@ struct uvm_va_block_wrapper_struct
// testing only.
bool inject_eviction_error;
// Force the next successful chunk allocation to then fail. Used for testing
// only to simulate driver metadata allocation failure.
// Force the next successful chunk allocation to then fail. Used for
// testing only to simulate driver metadata allocation failure.
bool inject_populate_error;
// Force the next split on this block to fail.
@@ -892,6 +909,18 @@ NV_STATUS uvm_va_block_map_mask(uvm_va_block_t *va_block,
uvm_prot_t new_prot,
UvmEventMapRemoteCause cause);
// Map pages not already mapped on the destination processor after a migration.
//
// LOCKING: The VA block lock must be held. If va_block_context->mm !=
// NULL, va_block_context->mm->mmap_lock must be held in at least read
// mode.
NV_STATUS uvm_va_block_migrate_map_mapped_pages(uvm_va_block_t *va_block,
uvm_va_block_retry_t *va_block_retry,
uvm_va_block_context_t *va_block_context,
uvm_va_block_region_t region,
uvm_processor_id_t dest_id,
UvmEventMapRemoteCause cause);
// Unmaps virtual regions from a single processor. This does not free page
// tables or physical memory. This is safe to call on the eviction path, but the
// caller must ensure that the block hasn't been killed.
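An illustrative caller sketch (not part of this change) for the migration mapping helper declared above, making its documented locking expectations explicit; the wrapper name is hypothetical and the assertions assume the usual uvm_assert_* helpers.

static NV_STATUS example_map_after_migration(uvm_va_block_t *va_block,
                                             uvm_va_block_retry_t *va_block_retry,
                                             uvm_va_block_context_t *va_block_context,
                                             uvm_va_block_region_t region,
                                             uvm_processor_id_t dest_id,
                                             UvmEventMapRemoteCause cause)
{
    // Per the comment above: the VA block lock must be held, and mmap_lock
    // must be held in at least read mode when va_block_context->mm != NULL.
    uvm_assert_mutex_locked(&va_block->lock);
    if (va_block_context->mm)
        uvm_assert_mmap_lock_locked(va_block_context->mm);

    return uvm_va_block_migrate_map_mapped_pages(va_block,
                                                 va_block_retry,
                                                 va_block_context,
                                                 region,
                                                 dest_id,
                                                 cause);
}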
@@ -1030,6 +1059,13 @@ NV_STATUS uvm_va_block_check_logical_permissions(uvm_va_block_t *va_block,
uvm_fault_access_type_t access_type,
bool allow_migration);
// Set a va_block as discarded, unmap the block and revoke its residency status.
//
// LOCKING: This takes and releases the VA block lock. If va_block_context->mm
// != NULL, va_block_context->mm->mmap_lock must be held in at least
// read mode.
NV_STATUS uvm_va_block_discard(uvm_va_block_t *va_block, uvm_va_block_context_t *va_block_context, NvU64 flags);
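An illustrative caller sketch (not part of this change); the wrapper name and the zero flags value are hypothetical. The block lock is deliberately not held here, since the function takes and releases it itself.

static NV_STATUS example_discard_block(uvm_va_block_t *va_block,
                                       uvm_va_block_context_t *va_block_context)
{
    // uvm_va_block_discard() acquires and drops the block lock internally;
    // only the mmap_lock expectation applies to the caller.
    if (va_block_context->mm)
        uvm_assert_mmap_lock_locked(va_block_context->mm);

    return uvm_va_block_discard(va_block, va_block_context, 0);
}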
// API for access privilege revocation
//
// Revoke prot_to_revoke access permissions for the given processor.
@@ -1250,8 +1286,8 @@ NV_STATUS uvm_va_block_cpu_fault(uvm_va_block_t *va_block,
// context.
//
// service_context must not be NULL and policy for service_context->region must
// match. See the comments for uvm_va_block_check_policy_is_valid(). If
// va_block is a HMM block, va_block_context->hmm.vma must be valid. See the
// match. See the comments for uvm_va_block_check_policy_is_valid(). If
// va_block is a HMM block, va_block_context->hmm.vma must be valid. See the
// comments for uvm_hmm_check_context_vma_is_valid() in uvm_hmm.h.
// service_context->prefetch_hint is set by this function.
//
@@ -1282,8 +1318,8 @@ NV_STATUS uvm_va_block_service_locked(uvm_processor_id_t processor_id,
// pages to new_residency.
//
// service_context must not be NULL and policy for service_context->region must
// match. See the comments for uvm_va_block_check_policy_is_valid(). If
// va_block is a HMM block, va_block_context->hmm.vma must be valid. See the
// match. See the comments for uvm_va_block_check_policy_is_valid(). If
// va_block is a HMM block, va_block_context->hmm.vma must be valid. See the
// comments for uvm_hmm_check_context_vma_is_valid() in uvm_hmm.h.
// service_context->prefetch_hint should be set before calling this function.
//
@@ -1311,8 +1347,8 @@ NV_STATUS uvm_va_block_service_copy(uvm_processor_id_t processor_id,
// to the new residency (which may be remote).
//
// service_context must not be NULL and policy for service_context->region must
// match. See the comments for uvm_va_block_check_policy_is_valid(). If
// va_block is a HMM block, va_block_context->hmm.vma must be valid. See the
// match. See the comments for uvm_va_block_check_policy_is_valid(). If
// va_block is a HMM block, va_block_context->hmm.vma must be valid. See the
// comments for uvm_hmm_check_context_vma_is_valid() in uvm_hmm.h.
// service_context must be initialized by calling uvm_va_block_service_copy()
// before calling this function.
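An illustrative ordering sketch (not part of this change) of the dependency described above, with arguments elided because only the copy-then-finish sequence is being shown:

    status = uvm_va_block_service_copy(..., service_context);
    if (status == NV_OK)
        status = uvm_va_block_service_finish(..., service_context);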
@@ -1499,8 +1535,8 @@ uvm_gpu_chunk_t *uvm_va_block_lookup_gpu_chunk(uvm_va_block_t *va_block, uvm_gpu
//
// service_context and service_context->block_context must not be NULL and
// policy for the region must match. See the comments for
// uvm_va_block_check_policy_is_valid(). If va_block is a HMM block,
// service->block_context->hmm.vma must be valid. See the comments for
// uvm_va_block_check_policy_is_valid(). If va_block is a HMM block,
// service->block_context->hmm.vma must be valid. See the comments for
// uvm_hmm_check_context_vma_is_valid() in uvm_hmm.h.
//
// LOCKING: The caller must hold the va_block lock. If
@@ -1550,7 +1586,8 @@ void uvm_va_block_retry_init(uvm_va_block_retry_t *uvm_va_block_retry);
// Frees all the remaining free chunks and unpins all the used chunks.
void uvm_va_block_retry_deinit(uvm_va_block_retry_t *uvm_va_block_retry, uvm_va_block_t *va_block);
// Evict all chunks from the block that are subchunks of the passed in root_chunk.
// Evict all chunks from the block that are subchunks of the passed in
// root_chunk.
//
// Add all the work tracking the eviction to the tracker.
//
@@ -1567,6 +1604,9 @@ NV_STATUS uvm_test_va_block_inject_error(UVM_TEST_VA_BLOCK_INJECT_ERROR_PARAMS *
NV_STATUS uvm_test_change_pte_mapping(UVM_TEST_CHANGE_PTE_MAPPING_PARAMS *params, struct file *filp);
NV_STATUS uvm_test_va_block_info(UVM_TEST_VA_BLOCK_INFO_PARAMS *params, struct file *filp);
NV_STATUS uvm_test_va_residency_info(UVM_TEST_VA_RESIDENCY_INFO_PARAMS *params, struct file *filp);
NV_STATUS uvm_test_va_block_discard_status(UVM_TEST_VA_BLOCK_DISCARD_STATUS_PARAMS *params, struct file *filp);
NV_STATUS uvm_test_va_block_discard_check_pmm_state(UVM_TEST_VA_BLOCK_DISCARD_CHECK_PMM_STATE_PARAMS *params,
struct file *filp);
// Compute the offset in system pages of addr from the start of va_block.
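// For example (illustrative values, assuming 4K system pages): with
// va_block->start == 0x7f0000200000 and addr == 0x7f0000203000, the offset is
// 0x3000 bytes, i.e. page index 3.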
static uvm_page_index_t uvm_va_block_cpu_page_index(uvm_va_block_t *va_block, NvU64 addr)
@@ -2139,16 +2179,12 @@ struct page *uvm_cpu_chunk_get_cpu_page(uvm_va_block_t *va_block, uvm_cpu_chunk_
struct page *uvm_va_block_get_cpu_page(uvm_va_block_t *va_block, uvm_page_index_t page_index);
// Physically map a CPU chunk so it is DMA'able from all registered GPUs.
// nid cannot be NUMA_NO_NODE.
// Locking: The va_block lock must be held.
NV_STATUS uvm_va_block_map_cpu_chunk_on_gpus(uvm_va_block_t *va_block,
uvm_cpu_chunk_t *chunk,
uvm_page_index_t page_index);
NV_STATUS uvm_va_block_map_cpu_chunk_on_gpus(uvm_va_block_t *va_block, uvm_cpu_chunk_t *chunk);
// Physically unmap a CPU chunk from all registered GPUs.
// Locking: The va_block lock must be held.
void uvm_va_block_unmap_cpu_chunk_on_gpus(uvm_va_block_t *va_block,
uvm_cpu_chunk_t *chunk);
void uvm_va_block_unmap_cpu_chunk_on_gpus(uvm_va_block_t *va_block, uvm_cpu_chunk_t *chunk);
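An illustrative caller sketch (not part of this change) for the chunk-granular signatures above; the wrapper name is hypothetical.

static NV_STATUS example_dma_map_cpu_chunk(uvm_va_block_t *va_block, uvm_cpu_chunk_t *chunk)
{
    // Both helpers above require the va_block lock, per their Locking notes.
    uvm_assert_mutex_locked(&va_block->lock);

    return uvm_va_block_map_cpu_chunk_on_gpus(va_block, chunk);
}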
// Remove any CPU chunks in the given region.
// Locking: The va_block lock must be held.
@@ -2163,8 +2199,7 @@ NvU64 uvm_va_block_get_physical_size(uvm_va_block_t *block,
uvm_page_index_t page_index);
// Get CPU page size or 0 if it is not mapped
NvU64 uvm_va_block_page_size_cpu(uvm_va_block_t *va_block,
uvm_page_index_t page_index);
NvU64 uvm_va_block_page_size_cpu(uvm_va_block_t *va_block, uvm_page_index_t page_index);
// Get GPU page size or 0 if it is not mapped on the given GPU
NvU64 uvm_va_block_page_size_gpu(uvm_va_block_t *va_block, uvm_gpu_id_t gpu_id, uvm_page_index_t page_index);
@@ -2262,8 +2297,8 @@ NV_STATUS uvm_va_block_populate_page_cpu(uvm_va_block_t *va_block,
// otherwise it will be initialized and deinitialized by the macro.
//
// The macro also locks and unlocks the block's lock internally as it's expected
// that the block's lock has been unlocked and relocked whenever the function call
// returns NV_ERR_MORE_PROCESSING_REQUIRED and this makes it clear that the
// that the block's lock has been unlocked and relocked whenever the function
// call returns NV_ERR_MORE_PROCESSING_REQUIRED and this makes it clear that the
// block's state is not locked across these calls.
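// Illustrative usage sketch (some_populate_operation is a placeholder for any
// call that can return NV_ERR_MORE_PROCESSING_REQUIRED):
//
//     uvm_va_block_retry_t block_retry;
//     NV_STATUS status;
//
//     status = UVM_VA_BLOCK_LOCK_RETRY(va_block, &block_retry,
//                                      some_populate_operation(va_block, &block_retry, ...));
//
// The call is repeated while it returns NV_ERR_MORE_PROCESSING_REQUIRED, with
// the block lock handled by the macro as described above.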
#define UVM_VA_BLOCK_LOCK_RETRY(va_block, block_retry, call) ({ \
NV_STATUS __status; \