535.43.02

This commit is contained in:
Andy Ritger
2023-05-30 10:11:36 -07:00
parent 6dd092ddb7
commit eb5c7665a1
1403 changed files with 295367 additions and 86235 deletions

View File

@@ -39,7 +39,7 @@
* @return NV_OK if the conversion is successful.
*/
static NV_INLINE
NV_STATUS ceIndexFromType(OBJGPU *pGpu, NvHandle hClient, RM_ENGINE_TYPE rmEngineType, NvU32 *ceIdx)
NV_STATUS ceIndexFromType(OBJGPU *pGpu, Device *pDevice, RM_ENGINE_TYPE rmEngineType, NvU32 *ceIdx)
{
NV_STATUS status = NV_OK;
RM_ENGINE_TYPE localRmEngType = rmEngineType;
@@ -56,7 +56,7 @@ NV_STATUS ceIndexFromType(OBJGPU *pGpu, NvHandle hClient, RM_ENGINE_TYPE rmEngin
KernelMIGManager *pKernelMIGManager = GPU_GET_KERNEL_MIG_MANAGER(pGpu);
MIG_INSTANCE_REF ref;
status = kmigmgrGetInstanceRefFromClient(pGpu, pKernelMIGManager, hClient, &ref);
status = kmigmgrGetInstanceRefFromDevice(pGpu, pKernelMIGManager, pDevice, &ref);
if (status != NV_OK)
return status;

View File

@@ -0,0 +1,224 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2021-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef CCSL_H
#define CCSL_H
#include "nvstatus.h"
#include "nvmisc.h"
#include "kernel/gpu/conf_compute/conf_compute.h"
typedef struct ccslContext_t *pCcslContext;
/*
* Initializes a context by providing client and channel information.
*
* ccslContext [in / out]
* hClient [in]
* hChannel [in]
*/
NV_STATUS
ccslContextInitViaChannel
(
pCcslContext *ppCtx,
NvHandle hClient,
NvHandle hChannel
);
/*
* Initializes a context by providing key ID information.
*
* ConfidentialCompute [in]
* ccslContext [in / out]
* globalKeyId [in]
*/
NV_STATUS
ccslContextInitViaKeyId
(
ConfidentialCompute *pConfCompute,
pCcslContext *ppCtx,
NvU32 globalKeyId
);
/*
* Clears the context and erases sensitive material such as keys.
*
* ccslContext [in / out]
*/
void
ccslContextClear
(
pCcslContext ctx
);
/* To be called before the library client triggers a Device-side encryption.
* Attempts to increment the library's Device-side message counter and returns an error if it will overflow.
*
* ccslContext [in]
* decryptIv [in]
*
Returns NV_ERR_INSUFFICIENT_RESOURCES if the next Device-side encryption would overflow the message counter.
* Returns NV_OK otherwise.
*/
NV_STATUS
ccslLogDeviceEncryption
(
pCcslContext ctx,
NvU8 *decryptIv
);
/* Request the next IV to be used in encryption. Storing it explicitly enables the caller
 * to perform encryption out of order using ccslEncryptWithIv.
*
* ccslContext [in / out]
* encryptIv [out]
*
Returns NV_ERR_INSUFFICIENT_RESOURCES if the next encryption would overflow the message counter.
* Returns NV_OK otherwise.
*/
NV_STATUS
ccslAcquireEncryptionIv
(
pCcslContext ctx,
NvU8 *encryptIv
);
/* Rotate the IV for the given direction.
*
* ccslContext [in / out]
* direction [in]
*/
NV_STATUS
ccslRotateIv
(
pCcslContext ctx,
NvU8 direction
);
/*
* Encrypt and sign data using provided IV
*
* ccslContext [in]
* bufferSize [in] - Size of buffer to be encrypted in units of bytes.
* inputBuffer [in] - Address of plaintext input buffer. For performance it should be 16-byte aligned.
encryptIv [in/out] - IV to use for encryption. The IV will be "dirtied" after this operation.
* outputBuffer [in/out] - Address of ciphertext output buffer.
* authTagBuffer [in/out] - Address of authentication tag. In APM it is 32 bytes. In HCC it is 16 bytes.
*
* Returns NV_OK.
*/
NV_STATUS
ccslEncryptWithIv
(
pCcslContext ctx,
NvU32 bufferSize,
NvU8 const *inputBuffer,
NvU8 *encryptIv,
NvU8 *outputBuffer,
NvU8 *authTagBuffer
);
/*
* If the message counter will not overflow, encrypt and sign the data.
*
* ccslContext [in]
* bufferSize [in] - Size of buffer to be encrypted in units of bytes.
* inputBuffer [in] - Address of plaintext input buffer. For performance it should be 16-byte aligned.
* outputBuffer [in/out] - Address of ciphertext output buffer.
* authTagBuffer [in/out] - Address of authentication tag. In APM it is 32 bytes. In HCC it is 16 bytes.
*
* Returns NV_ERR_INSUFFICIENT_RESOURCES if message counter will overflow.
* Returns NV_OK otherwise.
*/
NV_STATUS
ccslEncrypt
(
pCcslContext ctx,
NvU32 bufferSize,
NvU8 const *inputBuffer,
NvU8 *outputBuffer,
NvU8 *authTagBuffer
);
/*
* First verifies the authentication tag; if verification passes, the data is decrypted.
*
* ccslContext [in]
* bufferSize [in] - Size of buffer to be decrypted in units of bytes.
inputBuffer [in] - Address of ciphertext input buffer. For performance it should be 16-byte aligned.
decryptIv [in] - IV to use for decryption.
outputBuffer [in/out] - Address of plaintext output buffer.
* authTagBuffer [in] - Address of authentication tag. In APM it is 32 bytes. In HCC it is 16 bytes.
*
* Returns NV_ERR_INVALID_DATA if verification of the authentication tag fails.
* Returns NV_OK otherwise.
*/
NV_STATUS
ccslDecrypt
(
pCcslContext ctx,
NvU32 bufferSize,
NvU8 const *inputBuffer,
NvU8 const *decryptIv,
NvU8 *outputBuffer,
NvU8 const *authTagBuffer
);
/*
* Sign the plaintext message.
*
* ccslContext [in]
* bufferSize [in] - Size of buffer to be signed in units of bytes.
* inputBuffer [in] - Address of input buffer. For performance it should be 16-byte aligned.
* authTagBuffer [in/out] - Address of authentication tag. In HCC it is 32 bytes.
*
Returns NV_OK.
*/
NV_STATUS
ccslSign
(
pCcslContext ctx,
NvU32 bufferSize,
NvU8 const *inputBuffer,
NvU8 *authTagBuffer
);
#define CCSL_DIR_HOST_TO_DEVICE 0
#define CCSL_DIR_DEVICE_TO_HOST 1
/*
* Returns the number of messages that can be encrypted by the CPU (CCSL_DIR_HOST_TO_DEVICE)
* or encrypted by the GPU (CCSL_DIR_DEVICE_TO_HOST) before the message counter will overflow.
*
* ccslContext [in]
* direction [in] - Either CCSL_DIR_HOST_TO_DEVICE or CCSL_DIR_DEVICE_TO_HOST.
* messageNum [out] - Number of messages that can be encrypted before overflow.
*/
NV_STATUS
ccslQueryMessagePool
(
pCcslContext ctx,
NvU8 direction,
NvU64 *messageNum
);
#endif // CCSL_H
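
For orientation, here is a minimal, hedged sketch of how the declarations above compose into an encrypt/decrypt round trip. The handle values, buffer sizes, and the 12-byte IV width are assumptions for illustration (the header does not specify an IV size), and a real caller would match the encrypt/decrypt directions to the channel rather than decrypting its own output.

/* Illustrative sketch only -- not part of this commit. */
static NV_STATUS ccslRoundTripSketch(NvHandle hClient, NvHandle hChannel)
{
    pCcslContext ctx = NULL;
    NvU8 plaintext[256]  = {0};   // 16-byte-aligned sizes for performance
    NvU8 ciphertext[256] = {0};
    NvU8 decrypted[256]  = {0};
    NvU8 authTag[32];             // 32 bytes covers both the APM and HCC tag sizes
    NvU8 iv[12]          = {0};   // assumed AES-GCM-style 96-bit IV
    NV_STATUS status;

    status = ccslContextInitViaChannel(&ctx, hClient, hChannel);
    if (status != NV_OK)
        return status;

    // Acquiring the IV up front permits out-of-order encryption later.
    status = ccslAcquireEncryptionIv(ctx, iv);
    if (status == NV_OK)
        status = ccslEncryptWithIv(ctx, sizeof(plaintext), plaintext, iv,
                                   ciphertext, authTag);
    if (status == NV_OK)
        status = ccslDecrypt(ctx, sizeof(ciphertext), ciphertext, iv,
                             decrypted, authTag);

    ccslContextClear(ctx);        // erases key material
    return status;
}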

View File

@@ -0,0 +1,3 @@
#include "g_conf_compute_nvoc.h"

View File

@@ -0,0 +1,3 @@
#include "g_conf_compute_api_nvoc.h"

View File

@@ -0,0 +1,96 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2021-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef CONF_COMPUTE_KEYSTORE_H
#define CONF_COMPUTE_KEYSTORE_H
#include "nvtypes.h"
#include "nvstatus.h"
#include "cc_drv.h"
#include "kernel/gpu/fifo/kernel_channel.h"
// Named values for ccKeyStoreDeposit()'s slotNumber parameter.
#define KEYSTORE_SLOT_GSP 0
#define KEYSTORE_SLOT_SEC2 1
// LCE index can range from 0 to 7 inclusive.
#define KEYSTORE_SLOT_LCE_UMD(index) (2 + (index) * 3)
#define KEYSTORE_SLOT_LCE_KMD(index) (3 + (index) * 3)
#define KEYSTORE_SLOT_LCE_MGPU(index) (4 + (index) * 3)
/*!
* @brief Initialize the keystore.
*
* @param[in] pGpu Pointer to GPU object.
*
* @return NV_ERR_INVALID_STATE if system is not in Confidential Compute mode.
*/
NV_STATUS
ccKeyStoreInit (OBJGPU *pGpu);
/*!
* @brief Deposits a KMB into a keystore slot.
*
* @param[in] slotNumber Slot number into which the KMB will be deposited.
* @param[in] keyMaterialBundle Pair of key / IV / IV-mask tuples. The IV will be set to 0 by the function.
*
* @return NV_ERR_INVALID_INDEX if slotNumber is illegal, NV_OK otherwise.
*/
NV_STATUS
ccKeyStoreDeposit
(
NvU32 slotNumber,
CC_KMB keyMaterialBundle
);
/*!
* @brief Retrieves a KMB based on the channel. The keystore uses channel
*        information such as engine type and the associated privilege mode
*        to determine which KMB to fetch.
* The IV's channel counter for the given direction is pre-incremented.
*
* @param[in] pKernelChannel
* @param[in] rotateOperation Either ROTATE_IV_ENCRYPT, ROTATE_IV_DECRYPT,
*                            or ROTATE_IV_ALL_VALID.
* @param[out] keyMaterialBundle The KMB for the given channel.
*
* @return NV_ERR_INSUFFICIENT_RESOURCES if channel counter overflow would occur.
*         NV_ERR_GENERIC for other errors.
*         NV_OK otherwise.
*/
NV_STATUS
ccKeyStoreRetrieveViaChannel
(
KernelChannel *pKernelChannel,
ROTATE_IV_TYPE rotateOperation,
PCC_KMB keyMaterialBundle
);
/*!
* @brief Clears the contents of the keystore.
*/
void
ccKeyStoreClear (void);
#endif // CONF_COMPUTE_KEYSTORE_H
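
The slot macros above interleave three slots per LCE after the fixed GSP and SEC2 slots; a quick worked example of the resulting layout (the values follow directly from the definitions):

// Worked example of the slot layout implied by the macros above:
// GSP -> 0, SEC2 -> 1, then three consecutive slots per LCE.
static const NvU32 slotUmdLce0  = KEYSTORE_SLOT_LCE_UMD(0);   // 2 + 0*3 == 2
static const NvU32 slotMgpuLce7 = KEYSTORE_SLOT_LCE_MGPU(7);  // 4 + 7*3 == 25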

View File

@@ -1,5 +1,5 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2021-202 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-FileCopyrightText: Copyright (c) 2021-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
@@ -58,4 +58,9 @@
*/
#define FLCN_CTX_ENG_BUFFER_SIZE_HW 4096
/*!
* Number of register reads needed for reset signal propagation
*/
#define FLCN_RESET_PROPAGATION_DELAY_COUNT 10
#endif // FALCON_COMMON_H

View File

@@ -0,0 +1,47 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2004-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef GPU_CHILD_CLASS_DEFS_H
#define GPU_CHILD_CLASS_DEFS_H
/*!
* @file
* @details Provides the class definitions for every GPU child class without the
* need to include every individual header.
*/
#include "core/prelude.h"
#define GPU_CHILD_CLASS_DEFS_GPU_CHILD(className, accessorName, numInstances, bConstructEarly, gpuField) \
extern const struct NVOC_CLASS_DEF NV_CONCATENATE(__nvoc_class_def_, className);
#define GPU_CHILD \
GPU_CHILD_CLASS_DEFS_GPU_CHILD
#include "gpu/gpu_child_list.h"
// Sub-classes of GPU children
// Pmu sub-classes
extern const struct NVOC_CLASS_DEF __nvoc_class_def_Pmu10;
extern const struct NVOC_CLASS_DEF __nvoc_class_def_Pmu20;
#endif // GPU_CHILD_CLASS_DEFS_H

View File

@@ -1,5 +1,5 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2004-2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-FileCopyrightText: Copyright (c) 2004-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
@@ -105,12 +105,12 @@
#if GPU_CHILD_MODULE(KERNEL_DISPLAY)
GPU_CHILD_SINGLE_INST( KernelDisplay, GPU_GET_KERNEL_DISPLAY, 1, NV_FALSE, pKernelDisplay )
#endif
#if GPU_CHILD_MODULE(DISP)
GPU_CHILD_SINGLE_INST( OBJDISP, GPU_GET_DISP, 1, NV_FALSE, pDisp )
#endif
#if GPU_CHILD_MODULE(TMR)
GPU_CHILD_SINGLE_INST( OBJTMR, GPU_GET_TIMER, 1, NV_TRUE, pTmr )
#endif
#if GPU_CHILD_MODULE(DISP)
GPU_CHILD_SINGLE_INST( OBJDISP, GPU_GET_DISP, 1, NV_FALSE, pDisp )
#endif
#if GPU_CHILD_MODULE(BUS)
GPU_CHILD_SINGLE_INST( OBJBUS, GPU_GET_BUS, 1, NV_FALSE, pBus )
#endif
@@ -297,8 +297,11 @@
#if GPU_CHILD_MODULE(OFA)
GPU_CHILD_SINGLE_INST( OBJOFA, GPU_GET_OFA, 1, NV_FALSE, pOfa )
#endif
#if RMCFG_MODULE_CONF_COMPUTE && GPU_CHILD_MODULE(CONF_COMPUTE)
GPU_CHILD_SINGLE_INST( ConfidentialCompute, GPU_GET_CONF_COMPUTE, 1, NV_TRUE, pConfCompute )
#endif
#if RMCFG_MODULE_KERNEL_CCU && GPU_CHILD_MODULE(KERNEL_CCU)
GPU_CHILD_SINGLE_INST( KernelCcu, GPU_GET_KERNEL_CCU, 1, NV_FALSE, pKernelCcu )
GPU_CHILD_SINGLE_INST( KernelCcu, GPU_GET_KERNEL_CCU, 1, NV_FALSE, pKernelCcu )
#endif
// Undefine the entry macros to simplify call sites

View File

@@ -99,6 +99,7 @@ typedef enum
#define RM_ENGINE_TYPE_NVENC_SIZE 3
#define RM_ENGINE_TYPE_NVJPEG_SIZE 8
#define RM_ENGINE_TYPE_NVDEC_SIZE 8
#define RM_ENGINE_TYPE_OFA_SIZE 1
#define RM_ENGINE_TYPE_GR_SIZE 8
// Indexed engines
@@ -118,6 +119,15 @@ typedef enum
#define RM_ENGINE_TYPE_IS_NVJPEG(i) (((i) >= RM_ENGINE_TYPE_NVJPEG0) && ((i) < RM_ENGINE_TYPE_NVJPEG(RM_ENGINE_TYPE_NVJPEG_SIZE)))
#define RM_ENGINE_TYPE_NVJPEG_IDX(i) ((i) - RM_ENGINE_TYPE_NVJPEG0)
#define RM_ENGINE_TYPE_OFA(i) (RM_ENGINE_TYPE_OFA+(i))
#define RM_ENGINE_TYPE_IS_OFA(i) (((i) >= RM_ENGINE_TYPE_OFA) && ((i) < RM_ENGINE_TYPE_OFA(RM_ENGINE_TYPE_OFA_SIZE)))
#define RM_ENGINE_TYPE_OFA_IDX(i) ((i) - RM_ENGINE_TYPE_OFA)
#define RM_ENGINE_TYPE_IS_VIDEO(i) (RM_ENGINE_TYPE_IS_NVENC(i) | \
RM_ENGINE_TYPE_IS_NVDEC(i) | \
RM_ENGINE_TYPE_IS_NVJPEG(i) | \
RM_ENGINE_TYPE_IS_OFA(i))
#define RM_ENGINE_TYPE_GR(i) (RM_ENGINE_TYPE_GR0 + (i))
#define RM_ENGINE_TYPE_IS_GR(i) (((i) >= RM_ENGINE_TYPE_GR0) && ((i) < RM_ENGINE_TYPE_GR(RM_ENGINE_TYPE_GR_SIZE)))
#define RM_ENGINE_TYPE_GR_IDX(i) ((i) - RM_ENGINE_TYPE_GR0)
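
A short sketch of the new OFA helpers in use; with RM_ENGINE_TYPE_OFA_SIZE defined as 1, only index 0 is a valid OFA engine, and OFA now also satisfies the video predicate:

// Sketch: classify an engine type using the new OFA macros.
static NvBool ofaClassifySketch(void)
{
    RM_ENGINE_TYPE engine = RM_ENGINE_TYPE_OFA(0);   // only index 0 exists (SIZE == 1)
    NvU32 idx = RM_ENGINE_TYPE_OFA_IDX(engine);      // 0
    (void)idx;
    return RM_ENGINE_TYPE_IS_VIDEO(engine);          // NV_TRUE: OFA now counts as video
}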

View File

@@ -1,5 +1,5 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 1993-2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-FileCopyrightText: Copyright (c) 1993-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
@@ -33,28 +33,31 @@
#define GPU_FABRIC_PROBE_DEFAULT_PROBE_SLOWDOWN_THRESHOLD 10
typedef struct GPU_FABRIC_PROBE_INFO GPU_FABRIC_PROBE_INFO;
typedef struct GPU_FABRIC_PROBE_INFO_KERNEL GPU_FABRIC_PROBE_INFO_KERNEL;
NV_STATUS gpuFabricProbeStart(OBJGPU *pGpu,
GPU_FABRIC_PROBE_INFO **ppGpuFabricProbeInfo);
void gpuFabricProbeStop(GPU_FABRIC_PROBE_INFO *pGpuFabricProbeInfo);
GPU_FABRIC_PROBE_INFO_KERNEL **ppGpuFabricProbeInfoKernel);
void gpuFabricProbeStop(GPU_FABRIC_PROBE_INFO_KERNEL *pGpuFabricProbeInfoKernel);
void gpuFabricProbeSuspend(GPU_FABRIC_PROBE_INFO *pGpuFabricProbeInfo);
NV_STATUS gpuFabricProbeResume(GPU_FABRIC_PROBE_INFO *pGpuFabricProbeInfo);
void gpuFabricProbeSuspend(GPU_FABRIC_PROBE_INFO_KERNEL *pGpuFabricProbeInfoKernel);
NV_STATUS gpuFabricProbeResume(GPU_FABRIC_PROBE_INFO_KERNEL *pGpuFabricProbeInfoKernel);
NV_STATUS gpuFabricProbeGetGpuFabricHandle(GPU_FABRIC_PROBE_INFO *pInfo, NvU64 *pHandle);
NV_STATUS gpuFabricProbeGetGfId(GPU_FABRIC_PROBE_INFO *pInfo, NvU32 *pGfId);
NV_STATUS gpuFabricProbeGetfmCaps(GPU_FABRIC_PROBE_INFO *pInfo, NvU64 *pFmCaps);
NV_STATUS gpuFabricProbeGetClusterUuid(GPU_FABRIC_PROBE_INFO *pInfo, NvUuid *pClusterUuid);
NV_STATUS gpuFabricProbeGetFabricPartitionId(GPU_FABRIC_PROBE_INFO *pInfo, NvU16 *pFabricPartitionId);
NV_STATUS gpuFabricProbeGetGpaAddress(GPU_FABRIC_PROBE_INFO *pInfo, NvU64 *pGpaAddress);
NV_STATUS gpuFabricProbeGetGpaAddressRange(GPU_FABRIC_PROBE_INFO *pInfo, NvU64 *pGpaAddressRange);
NV_STATUS gpuFabricProbeGetFlaAddress(GPU_FABRIC_PROBE_INFO *pInfo, NvU64 *pFlaAddress);
NV_STATUS gpuFabricProbeGetFlaAddressRange(GPU_FABRIC_PROBE_INFO *pInfo, NvU64 *pFlaAddressRange);
NV_STATUS gpuFabricProbeGetNumProbeReqs(GPU_FABRIC_PROBE_INFO *pInfo, NvU64 *numProbes);
NV_STATUS gpuFabricProbeGetGpuFabricHandle(GPU_FABRIC_PROBE_INFO_KERNEL *pInfo, NvU64 *pHandle);
NV_STATUS gpuFabricProbeGetGfId(GPU_FABRIC_PROBE_INFO_KERNEL *pInfo, NvU32 *pGfId);
NV_STATUS gpuFabricProbeGetfmCaps(GPU_FABRIC_PROBE_INFO_KERNEL *pInfo, NvU64 *pFmCaps);
NV_STATUS gpuFabricProbeGetClusterUuid(GPU_FABRIC_PROBE_INFO_KERNEL *pInfo, NvUuid *pClusterUuid);
NV_STATUS gpuFabricProbeGetFabricPartitionId(GPU_FABRIC_PROBE_INFO_KERNEL *pInfo, NvU16 *pFabricPartitionId);
NV_STATUS gpuFabricProbeGetGpaAddress(GPU_FABRIC_PROBE_INFO_KERNEL *pInfo, NvU64 *pGpaAddress);
NV_STATUS gpuFabricProbeGetGpaAddressRange(GPU_FABRIC_PROBE_INFO_KERNEL *pInfo, NvU64 *pGpaAddressRange);
NV_STATUS gpuFabricProbeGetFlaAddress(GPU_FABRIC_PROBE_INFO_KERNEL *pInfo, NvU64 *pFlaAddress);
NV_STATUS gpuFabricProbeGetFlaAddressRange(GPU_FABRIC_PROBE_INFO_KERNEL *pInfo, NvU64 *pFlaAddressRange);
NV_STATUS gpuFabricProbeGetNumProbeReqs(GPU_FABRIC_PROBE_INFO_KERNEL *pInfo, NvU64 *numProbes);
NvBool gpuFabricProbeIsReceived(GPU_FABRIC_PROBE_INFO *pGpuFabricProbeInfo);
NvBool gpuFabricProbeIsSuccess(GPU_FABRIC_PROBE_INFO *pGpuFabricProbeInfo);
NV_STATUS gpuFabricProbeGetFmStatus(GPU_FABRIC_PROBE_INFO *pGpuFabricProbeInfo);
NvBool gpuFabricProbeIsReceived(GPU_FABRIC_PROBE_INFO_KERNEL *pGpuFabricProbeInfoKernel);
NvBool gpuFabricProbeIsSuccess(GPU_FABRIC_PROBE_INFO_KERNEL *pGpuFabricProbeInfoKernel);
NV_STATUS gpuFabricProbeGetFmStatus(GPU_FABRIC_PROBE_INFO_KERNEL *pGpuFabricProbeInfoKernel);
NvBool gpuFabricProbeIsSupported(OBJGPU *pGpu);
NV_STATUS gpuFabricProbeSetBwMode(NvU8 mode);
NV_STATUS gpuFabricProbeGetlinkMaskToBeReduced(GPU_FABRIC_PROBE_INFO_KERNEL *pGpuFabricProbeInfoKernel,
NvU32 *linkMaskToBeReduced);
#endif // GPU_FABRIC_PROBE_H

View File

@@ -139,6 +139,10 @@ static NV_INLINE NvU32 timeoutApplyScale(TIMEOUT_DATA *pTD, NvU32 timeout)
#define gpuScaleTimeout(g,a) timeoutApplyScale(&(g)->timeoutData, a)
#define gpuTimeoutCondWait(g,a,b,t) timeoutCondWait(&(g)->timeoutData, t, a, b, __LINE__)
#define GPU_ENG_RESET_TIMEOUT_VALUE(g, t) (t)
//
// In SCSIM simulation platform, both CPU and GPU are simulated and the reg write/read itself
// takes more time. This helper macro handles it with increased timeout value.
//
#define GPU_ENG_RESET_TIMEOUT_VALUE(g, t) ((gpuIsSelfHosted(g) && IS_SIMULATION(g)) ? 1000 : (t))
#endif // _GPU_TIMEOUT_H_

View File

@@ -34,7 +34,7 @@
*
* Not all buffer types are supported on every GPU.
*/
#define GR_GLOBALCTX_BUFFER_DEF(x) \
#define GR_GLOBALCTX_BUFFER_DEF(x) \
NV_ENUM_ENTRY(x, GR_GLOBALCTX_BUFFER_BUNDLE_CB, 0x00000000) \
NV_ENUM_ENTRY(x, GR_GLOBALCTX_BUFFER_PAGEPOOL, 0x00000001) \
NV_ENUM_ENTRY(x, GR_GLOBALCTX_BUFFER_ATTRIBUTE_CB, 0x00000002) \
@@ -50,7 +50,7 @@ NV_ENUM_DEF(GR_GLOBALCTX_BUFFER, GR_GLOBALCTX_BUFFER_DEF)
#define GR_GLOBALCTX_BUFFER_COUNT NV_ENUM_SIZE(GR_GLOBALCTX_BUFFER)
#define GR_CTX_BUFFER_DEF(x) \
#define GR_CTX_BUFFER_DEF(x) \
NV_ENUM_ENTRY(x, GR_CTX_BUFFER_MAIN, 0x00000000) \
NV_ENUM_ENTRY(x, GR_CTX_BUFFER_ZCULL, 0x00000001) \
NV_ENUM_ENTRY(x, GR_CTX_BUFFER_PM, 0x00000002) \

View File

@@ -1,5 +1,5 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-FileCopyrightText: Copyright (c) 2022-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
@@ -25,8 +25,55 @@
#define GSP_FW_HEAP_H
// Static defines for the GSP FW WPR Heap
#define GSP_FW_HEAP_SIZE_LIBOS2 (64u << 20)
#define GSP_FW_HEAP_SIZE_LIBOS3_BAREMETAL (84u << 20)
#define GSP_FW_HEAP_SIZE_LIBOS3_VGPU (549u << 20)
#define GSP_FW_HEAP_PARAM_OS_SIZE_LIBOS2 (0 << 20) // No FB heap usage
#define GSP_FW_HEAP_PARAM_OS_SIZE_LIBOS3 (20 << 20)
//
// Calibrated by observing RM init heap usage - the amount of GSP-RM heap memory
// used during GSP-RM boot and Kernel RM initialization, up to and including the
// first client subdevice allocation.
//
#define GSP_FW_HEAP_PARAM_BASE_RM_SIZE_TU10X (8 << 20) // Turing thru Ada
#define GSP_FW_HEAP_PARAM_BASE_RM_SIZE_GH100 (14 << 20) // Hopper+
//
// Calibrated by observing RM init heap usage on GPUs with various FB sizes.
// This seems to fit the data fairly well, but is likely inaccurate (differences
// in heap usage more likely correlate with GPU architecture than with FB size).
// TODO: this requires more detailed profiling and tuning.
//
#define GSP_FW_HEAP_PARAM_SIZE_PER_GB_FB (96 << 10) // All architectures
//
// This number is calibrated by profiling the WPR heap usage of a single
// client channel allocation. In practice, channel allocations on newer
// architectures are around 44KB-46KB (depending on internal memory
// tracking overhead configured in GSP-RM).
//
// Note: Turing supports 4096 channels vs 2048 on Ampere+, but the heap is
// sized to support only 2048 channels - otherwise the Turing heap balloons
// to 176MB+ on already small-FB parts.
//
// Note: The 2048 channel limit is per-runlist. GSP-RM currently uses only
// a single ChID space across all engines, because per-runlist channel RAM is
// disabled by default in most configurations. If/once per-runlist ChID spaces
// are used on GSP-RM, this will likely no longer be sufficient/relevant as
// the memory that could be needed for client channel allocations will far
// exceed the amount we can carve out for GSP-RM's heap (max ChID will no longer
// be the limiter).
//
#define GSP_FW_HEAP_PARAM_CLIENT_ALLOC_SIZE ((48 << 10) * 2048) // Support 2048 channels
#define GSP_FW_HEAP_SIZE_VGPU_DEFAULT (549 << 20) // Default for all VGPU configs
// Min/max bounds for heap size override by regkey
#define GSP_FW_HEAP_SIZE_OVERRIDE_LIBOS2_MIN_MB (64u)
#define GSP_FW_HEAP_SIZE_OVERRIDE_LIBOS2_MAX_MB (256u)
#define GSP_FW_HEAP_SIZE_OVERRIDE_LIBOS3_BAREMETAL_MIN_MB (84u)
#define GSP_FW_HEAP_SIZE_OVERRIDE_LIBOS3_BAREMETAL_MAX_MB (276u)
#define GSP_FW_HEAP_SIZE_OVERRIDE_LIBOS3_VGPU_MIN_MB (549u)
#define GSP_FW_HEAP_SIZE_OVERRIDE_LIBOS3_VGPU_MAX_MB (1024u)
#endif // GSP_FW_HEAP_H
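
To make the magnitudes concrete, a hedged composition of these parameters for a hypothetical 24 GB Hopper board; the exact formula GSP-RM applies is not shown in this commit, so this only illustrates how the pieces add up before the regkey min/max clamping:

// Illustrative only: for fbSizeGB == 24 this is
// 14 MB + 20 MB + (96 KB * 24) + (48 KB * 2048) ~= 14 + 20 + 2.25 + 96 ~= 132 MB.
static NvU64 gspHeapEstimateSketch(NvU64 fbSizeGB)
{
    return GSP_FW_HEAP_PARAM_BASE_RM_SIZE_GH100        // boot/init heap (Hopper+)
         + GSP_FW_HEAP_PARAM_OS_SIZE_LIBOS3            // LIBOS3 OS carve-out
         + GSP_FW_HEAP_PARAM_SIZE_PER_GB_FB * fbSizeGB // per-GB-of-FB scaling
         + GSP_FW_HEAP_PARAM_CLIENT_ALLOC_SIZE;        // 48 KB * 2048 channels
}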

View File

@@ -53,6 +53,12 @@ typedef struct
MESSAGE_QUEUE_INIT_ARGUMENTS messageQueueInitArguments;
GSP_SR_INIT_ARGUMENTS srInitArguments;
NvU32 gpuInstance;
struct
{
NvU64 pa;
NvU64 size;
} profilerArgs;
} GSP_ARGUMENTS_CACHED;
#endif // GSP_INIT_ARGS_H

View File

@@ -1,5 +1,5 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2019-2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-FileCopyrightText: Copyright (c) 2019-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
@@ -75,7 +75,7 @@ typedef struct GspStaticConfigInfo_t
GspSMInfo SM_info;
NvBool poisonFuseEnabled;
NvU64 fb_length;
NvU32 fbio_mask;
NvU32 fb_bus_width;
@@ -100,6 +100,7 @@ typedef struct GspStaticConfigInfo_t
NvBool bIsMobile;
NvBool bIsGc6Rtd3Allowed;
NvBool bIsGcOffRtd3Allowed;
NvBool bIsGcoffLegacyAllowed;
NvU64 bar1PdeBase;
NvU64 bar2PdeBase;
@@ -127,7 +128,10 @@ typedef struct GspStaticConfigInfo_t
// Subdevice handle for internal RMAPI control.
NvHandle hInternalSubdevice;
NvBool bSelfHostedMode;
NvBool bAtsSupported;
NvBool bIsGpuUefi;
} GspStaticConfigInfo;
// Pushed from CPU-RM to GSP-RM
@@ -147,6 +151,7 @@ typedef struct GspSystemInfo
NvU64 clPdbProperties;
NvU32 Chipset;
NvBool bGpuBehindBridge;
NvBool bMnocAvailable;
NvBool bUpstreamL0sUnsupported;
NvBool bUpstreamL1Unsupported;
NvBool bUpstreamL1PorSupported;
@@ -155,6 +160,9 @@ typedef struct GspSystemInfo
BUSINFO FHBBusInfo;
BUSINFO chipsetIDInfo;
ACPI_METHOD_DATA acpiMethodData;
NvU32 hypervisorType;
NvBool bIsPassthru;
NvU64 sysTimerOffsetNs;
} GspSystemInfo;

View File

@@ -65,6 +65,7 @@ typedef struct _message_queue_info
msgqHandle hQueue; // Do not allow requests when hQueue is null.
NvU32 txSeqNum; // Next sequence number for tx.
NvU32 rxSeqNum; // Next sequence number for rx.
NvU32 txBufferFull;
NvU32 queueIdx; // QueueIndex used to identify which task the message is supposed to be sent to.
} MESSAGE_QUEUE_INFO;

View File

@@ -1,5 +1,5 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 1993-2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-FileCopyrightText: Copyright (c) 1993-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
@@ -61,6 +61,7 @@
#define MC_ENGINE_IDX_CE7 22
#define MC_ENGINE_IDX_CE8 23
#define MC_ENGINE_IDX_CE9 24
#define MC_ENGINE_IDX_CE_MAX MC_ENGINE_IDX_CE9
#define MC_ENGINE_IDX_VIC 35
#define MC_ENGINE_IDX_ISOHUB 36
#define MC_ENGINE_IDX_VGPU 37
@@ -136,7 +137,8 @@
#define MC_ENGINE_IDX_DISP_GSP 163
#define MC_ENGINE_IDX_REPLAYABLE_FAULT_CPU 164
#define MC_ENGINE_IDX_NON_REPLAYABLE_FAULT_CPU 165
#define MC_ENGINE_IDX_MAX 166 // This must be kept as the max bit if
#define MC_ENGINE_IDX_PXUC 166
#define MC_ENGINE_IDX_MAX 167 // This must be kept as the max bit if
// we need to add more engines
#define MC_ENGINE_IDX_INVALID 0xFFFFFFFF
@@ -159,6 +161,9 @@
// Index ESCHED reference
#define MC_ENGINE_IDX_ESCHEDn(x) (MC_ENGINE_IDX_ESCHED + (x))
#define MC_ENGINE_IDX_IS_CE(x) \
((MC_ENGINE_IDX_CE(0) <= (x)) && ((x) <= MC_ENGINE_IDX_CE_MAX))
MAKE_BITVECTOR(MC_ENGINE_BITVECTOR, MC_ENGINE_IDX_MAX);
typedef MC_ENGINE_BITVECTOR *PMC_ENGINE_BITVECTOR;
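
Usage of the new range check is straightforward; MC_ENGINE_IDX_CE(0) is assumed to expand to the first CE index defined elsewhere in this header:

// Sketch: the new cap makes the CE range check inclusive of CE9 (bit 24).
static const NvBool bCe9IsCe = MC_ENGINE_IDX_IS_CE(MC_ENGINE_IDX_CE9);  // NV_TRUE (24 == CE_MAX)
static const NvBool bVicIsCe = MC_ENGINE_IDX_IS_CE(MC_ENGINE_IDX_VIC);  // NV_FALSE (35 > CE_MAX)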

View File

@@ -0,0 +1,43 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef INTR_COMMON_H
#define INTR_COMMON_H 1
/*! Common defines used by both Intr and OBJINTRABLE */
/*! Kinds of interrupts that a unit can have. */
typedef enum {
/*!
* Legacy concept of "stalling" interrupts.
*
* These may have a RETRIGGER mechanism.
*/
INTR_KIND_INTERRUPT,
/*! Notification "non-stalling" interrupts. */
INTR_KIND_NOTIFICATION,
INTR_KIND_COUNT
} INTR_KIND;
#endif /* ifndef INTR_COMMON_H */

View File

@@ -0,0 +1,92 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2004-2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef KERN_GPU_POWER_H
#define KERN_GPU_POWER_H
#include "ctrl/ctrl2080/ctrl2080power.h" // NV2080_CTRL_GC6_FLAVOR_ID_MAX
#include "diagnostics/profiler.h"
typedef enum
{
GPU_GC6_STATE_POWERED_ON = 0 ,
GPU_GC6_STATE_EXITED = GPU_GC6_STATE_POWERED_ON ,
GPU_GC6_STATE_ENTERING ,
GPU_GC6_STATE_ENTERING_FAILED ,
GPU_GC6_STATE_ENTERED ,
GPU_GC6_STATE_EXITING ,
GPU_GC6_STATE_EXITING_FAILED ,
} GPU_GC6_STATE;
// TODO-SC use mask for the bool variables
typedef struct
{
GPU_GC6_STATE currentState;
NvU32 executedStepMask; // step mask executed during entry sequence
NvU32 stepMask[NV2080_CTRL_GC6_FLAVOR_ID_MAX]; // step mask cache
} _GPU_GC6_STATE;
// GPU event mask operation
#define GC6_REFCOUNT_MASK_SET(pGpu, refCountBit) \
do \
{ \
if (pGpu != NULL) \
{ \
((pGpu->gc6State.refCountMask) |= (NVBIT(refCountBit))); \
} \
} while(0)
#define GC6_REFCOUNT_MASK_CLEAR(pGpu, refCountBit) \
do \
{ \
if (pGpu != NULL) \
{ \
((pGpu->gc6State.refCountMask) &= ~(NVBIT(refCountBit))); \
} \
} while(0)
#define GC6_REFCOUNT_MASK_GET_FROM_EVENT(event) ((event) / 2)
// GC6 related defines
#define GC6_FB_CLAMP_TIMEOUT_MS 10
// Macros for GPU_GC6_STATE
#define IS_GPU_GC6_STATE_POWERED_ON(obj) (obj->gc6State.currentState == GPU_GC6_STATE_POWERED_ON)
#define IS_GPU_GC6_STATE_EXITED(obj) (obj->gc6State.currentState == GPU_GC6_STATE_EXITED)
#define IS_GPU_GC6_STATE_ENTERING(obj) (obj->gc6State.currentState == GPU_GC6_STATE_ENTERING)
#define IS_GPU_GC6_STATE_ENTERED(obj) (obj->gc6State.currentState == GPU_GC6_STATE_ENTERED)
#define IS_GPU_GC6_STATE_EXITING(obj) (obj->gc6State.currentState == GPU_GC6_STATE_EXITING)
#define SET_GPU_GC6_STATE(obj, state) (obj->gc6State.currentState = state)
#define SET_GPU_GC6_STATE_AND_LOG(obj, state) \
do { \
SET_GPU_GC6_STATE(obj, state); \
RMTRACE_GPU(_GC6_STATE, obj->gpuId, state, 0, 0, 0, 0, 0, 0); \
} while(0)
// Macro to check if a given GC6 step id is set
#define GPU_IS_GC6_STEP_ID_SET(stepId, stepMask) \
((NVBIT(NV2080_CTRL_GC6_STEP_ID_##stepId) & (stepMask)) != 0)
#endif // KERN_GPU_POWER_H
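
As a sketch of the step-mask helper, assuming a step named SR_ENTRY exists among the NV2080_CTRL_GC6_STEP_ID_* values in ctrl2080power.h (the concrete step names are not part of this hunk):

static NvBool gc6StepSketch(void)
{
    // Assumed step name; the real ids live in ctrl2080power.h.
    NvU32 stepMask = NVBIT(NV2080_CTRL_GC6_STEP_ID_SR_ENTRY);
    // Token pasting expands the check to
    // (NVBIT(NV2080_CTRL_GC6_STEP_ID_SR_ENTRY) & stepMask) != 0.
    return GPU_IS_GC6_STEP_ID_SET(SR_ENTRY, stepMask);
}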

View File

@@ -0,0 +1,122 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include "g_ce_utils_nvoc.h"
#ifndef CE_UTILS_H
#define CE_UTILS_H
#include "gpu/gpu_resource.h" // GpuResource
#include "class/cl0050.h"
#include "ctrl/ctrl0050.h"
#include "kernel/gpu/mem_mgr/channel_utils.h"
typedef struct
{
MEMORY_DESCRIPTOR *pMemDesc;
NvU64 offset;
NvU64 length;
NvU32 pattern;
NvU64 flags;
NvU64 submittedWorkId; // Payload to poll for async completion
} CEUTILS_MEMSET_PARAMS;
typedef struct
{
MEMORY_DESCRIPTOR *pSrcMemDesc;
MEMORY_DESCRIPTOR *pDstMemDesc;
NvU64 dstOffset;
NvU64 srcOffset;
NvU64 length;
NvU64 flags;
NvU64 submittedWorkId; // Payload to poll for async completion
} CEUTILS_MEMCOPY_PARAMS;
NVOC_PREFIX(ceutils) class CeUtils : Object
{
public:
NV_STATUS ceutilsConstruct(CeUtils *pCeUtils, OBJGPU *pGpu, NV0050_ALLOCATION_PARAMETERS *pAllocParams);
void ceutilsDestruct(CeUtils *pCeUtils);
NV_STATUS ceutilsInitialize(CeUtils *pCeUtils, OBJGPU *pGpu, NV0050_ALLOCATION_PARAMETERS *pAllocParams);
void ceutilsDeinit(CeUtils *pCeUtils);
void ceutilsRegisterGPUInstance(CeUtils *pCeUtils, KERNEL_MIG_GPU_INSTANCE *pKernelMIGGPUInstance);
NV_STATUS ceutilsMemset(CeUtils *pCeUtils, CEUTILS_MEMSET_PARAMS *pParams);
NV_STATUS ceutilsMemcopy(CeUtils *pCeUtils, CEUTILS_MEMCOPY_PARAMS *pParams);
NvU64 ceutilsUpdateProgress(CeUtils *pCeUtils);
void ceutilsServiceInterrupts(CeUtils *pCeUtils);
//
// Internal states
//
NvHandle hClient;
NvHandle hDevice;
NvHandle hSubdevice;
OBJCHANNEL *pChannel;
KERNEL_MIG_GPU_INSTANCE *pKernelMIGGPUInstance;
OBJGPU *pGpu;
KernelCE *pKCe;
NvBool bUseVasForCeCopy;
NvU32 hTdCopyClass;
NvU64 lastSubmittedPayload;
NvU64 lastCompletedPayload;
};
#if defined(DEBUG) || defined (DEVELOP)
NVOC_PREFIX(ceutilsapi) class CeUtilsApi : GpuResource
{
public:
NV_STATUS ceutilsapiConstruct(CeUtilsApi *pCeUtilsApi, CALL_CONTEXT *pCallContext,
RS_RES_ALLOC_PARAMS_INTERNAL *pParams)
: GpuResource(pCallContext, pParams);
void ceutilsapiDestruct(CeUtilsApi *pCeUtilsApi);
//
// Below APIs are only provided for SRT testing, thus only available for debug or
// develop driver builds
//
//
RMCTRL_EXPORT(NV0050_CTRL_CMD_MEMSET, RMCTRL_FLAGS(PRIVILEGED, API_LOCK_READONLY))
NV_STATUS ceutilsapiCtrlCmdMemset(CeUtilsApi *pCeUtilsApi, NV0050_CTRL_MEMSET_PARAMS *pParams);
RMCTRL_EXPORT(NV0050_CTRL_CMD_MEMCOPY, RMCTRL_FLAGS(PRIVILEGED, API_LOCK_READONLY))
NV_STATUS ceutilsapiCtrlCmdMemcopy(CeUtilsApi *pCeUtilsApi, NV0050_CTRL_MEMCOPY_PARAMS *pParams);
RMCTRL_EXPORT(NV0050_CTRL_CMD_CHECK_PROGRESS, RMCTRL_FLAGS(PRIVILEGED, API_LOCK_READONLY))
NV_STATUS ceutilsapiCtrlCmdCheckProgress(CeUtilsApi *pCeUtilsApi, NV0050_CTRL_CHECK_PROGRESS_PARAMS *pParams);
CeUtils *pCeUtils;
};
#endif
#endif // CE_UTILS_H
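
A hedged sketch of driving the memset path declared above; construction of pCeUtils and pMemDesc is elided, the zero flags value is an assumption, and the completion poll mirrors the submittedWorkId comment in CEUTILS_MEMSET_PARAMS:

// Sketch: scrub a whole allocation through CeUtils, then poll for completion.
static NV_STATUS ceutilsScrubSketch(CeUtils *pCeUtils, MEMORY_DESCRIPTOR *pMemDesc)
{
    CEUTILS_MEMSET_PARAMS params = {0};
    params.pMemDesc = pMemDesc;
    params.offset   = 0;
    params.length   = memdescGetSize(pMemDesc); // scrub the whole allocation
    params.pattern  = 0;                        // zero fill
    params.flags    = 0;                        // assumed: no special flags needed

    NV_ASSERT_OK_OR_RETURN(ceutilsMemset(pCeUtils, &params));

    // params.submittedWorkId is the payload to poll for async completion.
    while (ceutilsUpdateProgress(pCeUtils) < params.submittedWorkId)
        ceutilsServiceInterrupts(pCeUtils);

    return NV_OK;
}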

View File

@@ -0,0 +1,36 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef _CE_UTILS_SIZES_H
#define _CE_UTILS_SIZES_H
#define CE_MAX_BYTES_PER_LINE 0xffffffffULL
#define CE_NUM_COPY_BLOCKS 4096
#define CE_CHANNEL_SEMAPHORE_SIZE 8
#define CE_GPFIFO_SIZE (NV906F_GP_ENTRY__SIZE * CE_NUM_COPY_BLOCKS)
#define CE_CHANNEL_NOTIFIER_SIZE (sizeof(NvNotification) * \
NV_CHANNELGPFIFO_NOTIFICATION_TYPE__SIZE_1)
#define CE_METHOD_SIZE_PER_BLOCK 0x64
#define FAST_SCRUBBER_METHOD_SIZE_PER_BLOCK 0x78
#endif // _CE_UTILS_SIZES_H

View File

@@ -0,0 +1,157 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef _CHANNEL_UTILS_H_
#define _CHANNEL_UTILS_H_
#include "core/core.h"
#include "gpu/gpu.h"
#include "gpu/mem_mgr/mem_mgr.h"
#include "gpu/ce/kernel_ce.h"
#include "gpu/bus/kern_bus.h"
#include "core/prelude.h"
#include "rmapi/rs_utils.h"
#include "nvos.h"
#include "class/cl906f.h"
#include "class/cl906f.h"
#include "class/cl906fsw.h"
#include "class/clb0b5.h" // MAXWELL_DMA_COPY_A
#include "class/clc0b5.h" // PASCAL_DMA_COPY_A
#include "class/clc1b5.h" // PASCAL_DMA_COPY_B
#include "class/clc3b5.h" // VOLTA_DMA_COPY_A
#include "class/clc5b5.h" // TURING_DMA_COPY_A
#include "class/clc6b5.h" // AMPERE_DMA_COPY_A
#include "class/clc7b5.h" // AMPERE_DMA_COPY_B
#include "class/clc8b5.h" // HOPPER_DMA_COPY_A
#include "class/clc86f.h" // HOPPER_CHANNEL_GPFIFO_A
#include "nvctassert.h"
#include "vgpu/vgpu_guest_pma_scrubber.h"
#define RM_SUBCHANNEL 0x0
#define NV_PUSH_METHOD(OpType, SubCh, Method, Count) \
(DRF_DEF(906F, _DMA, _SEC_OP, OpType) | \
DRF_NUM(906F, _DMA, _METHOD_ADDRESS, (Method) >> 2) | \
DRF_NUM(906F, _DMA, _METHOD_SUBCHANNEL, (SubCh)) | \
DRF_NUM(906F, _DMA, _METHOD_COUNT, (Count)))
#define _NV_ASSERT_CONTIGUOUS_METHOD(a1, a2) NV_ASSERT((a2) - (a1) == 4)
#define NV_PUSH_DATA(Data) MEM_WR32(pPtr++, (Data))
#define _NV_PUSH_INC_1U(SubCh, a1, d1, Count) \
do \
{ \
NV_PUSH_DATA(NV_PUSH_METHOD(_INC_METHOD, SubCh, a1, Count)); \
NV_PUSH_DATA(d1); \
} while (0)
#define NV_PUSH_INC_1U(SubCh, a1, d1) \
do \
{ \
_NV_PUSH_INC_1U (SubCh, a1, d1, 1); \
} while (0)
#define NV_PUSH_INC_2U(SubCh, a1, d1, a2, d2) \
do \
{ \
_NV_ASSERT_CONTIGUOUS_METHOD(a1, a2); \
_NV_PUSH_INC_1U(SubCh, a1, d1, 2); \
NV_PUSH_DATA(d2); \
} while (0)
#define NV_PUSH_INC_3U(SubCh, a1, d1, a2, d2, a3, d3) \
do \
{ \
_NV_ASSERT_CONTIGUOUS_METHOD(a1, a2); \
_NV_ASSERT_CONTIGUOUS_METHOD(a2, a3); \
_NV_PUSH_INC_1U(SubCh, a1, d1, 3); \
NV_PUSH_DATA(d2); \
NV_PUSH_DATA(d3); \
} while (0)
#define NV_PUSH_INC_4U(SubCh, a1, d1, a2, d2, a3, d3, a4, d4) \
do \
{ \
_NV_ASSERT_CONTIGUOUS_METHOD(a1, a2); \
_NV_ASSERT_CONTIGUOUS_METHOD(a2, a3); \
_NV_ASSERT_CONTIGUOUS_METHOD(a3, a4); \
_NV_PUSH_INC_1U(SubCh, a1, d1, 4); \
NV_PUSH_DATA(d2); \
NV_PUSH_DATA(d3); \
NV_PUSH_DATA(d4); \
} while (0)
#define READ_CHANNEL_PAYLOAD_SEMA(channel) MEM_RD32((NvU8*)channel->pbCpuVA + \
channel->finishPayloadOffset)
#define READ_CHANNEL_PB_SEMA(channel) MEM_RD32((NvU8*)channel->pbCpuVA + \
channel->semaOffset)
#define WRITE_CHANNEL_PB_SEMA(channel, val) MEM_WR32((NvU8*)channel->pbCpuVA + \
channel->semaOffset, val);
#define WRITE_CHANNEL_PAYLOAD_SEMA(channel,val) MEM_WR32((NvU8*)channel->pbCpuVA + \
channel->finishPayloadOffset, val);
//
// This struct contains parameters needed to send a pushbuffer for a CE
// operation. This interface only supports contiguous operations.
//
typedef struct
{
NvBool bCeMemcopy; // Whether this is a CE memcopy;
// If set to false, this will be a memset operation
NvU64 dstAddr; // Physical address of the destination
NvU64 srcAddr; // Physical address of the source; only valid for memcopy
NvU32 size;
NvU32 pattern; // Fixed pattern to memset to. Only valid for memset
NvU32 payload; // Payload value used to release semaphore
NvU64 clientSemaAddr;
NV_ADDRESS_SPACE dstAddressSpace;
NV_ADDRESS_SPACE srcAddressSpace;
NvU32 dstCpuCacheAttrib;
NvU32 srcCpuCacheAttrib;
} CHANNEL_PB_INFO;
NV_STATUS channelSetupIDs(OBJCHANNEL *pChannel, OBJGPU *pGpu, NvBool bUseVasForCeCopy, NvBool bMIGInUse);
void channelSetupChannelBufferSizes(OBJCHANNEL *pChannel);
// Needed for pushbuffer management
NV_STATUS channelWaitForFreeEntry(OBJCHANNEL *pChannel, NvU32 *pPutIndex);
NV_STATUS channelFillGpFifo(OBJCHANNEL *pChannel, NvU32 putIndex, NvU32 methodsLength);
NvU32 channelFillPb(OBJCHANNEL *pChannel, NvU32 putIndex, NvBool bPipelined,
NvBool bInsertFinishPayload, CHANNEL_PB_INFO *pChannelPbInfo);
NvU32 channelFillPbFastScrub(OBJCHANNEL *pChannel, NvU32 putIndex, NvBool bPipelined,
NvBool bInsertFinishPayload, CHANNEL_PB_INFO *pChannelPbInfo);
// Needed for work tracking
NV_STATUS channelWaitForFinishPayload(OBJCHANNEL *pChannel, NvU64 targetPayload);
NvU64 channelGetFinishPayload(OBJCHANNEL *pChannel);
#endif // _CHANNEL_UTILS_H_
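
For reference, a sketch of the incrementing-method macros in use. NV_PUSH_DATA writes through a local cursor that must be named pPtr, so the caller declares it; the method offsets here are placeholders, not real class methods:

// Sketch: emit one contiguous two-method pair and report the bytes written.
static NvU32 pushTwoMethodsSketch(void *pbCpuVA)
{
    NvU32 *pPtr = (NvU32 *)pbCpuVA;     // NV_PUSH_DATA advances this cursor
    NV_PUSH_INC_2U(RM_SUBCHANNEL,
                   0x400, 0xdeadbeef,   // hypothetical method a1 with data d1
                   0x404, 0xcafef00d);  // a2 must satisfy (a2 - a1) == 4
    return (NvU32)((NvU8 *)pPtr - (NvU8 *)pbCpuVA);  // bytes emitted
}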

View File

@@ -125,7 +125,7 @@ typedef struct PMA_ALLOC_INFO
{
NvBool bContig;
NvU32 pageCount;
NvU32 pageSize;
NvU64 pageSize;
NvU32 refCount;
NvU64 allocSize;
NvU32 flags;

View File

@@ -34,16 +34,18 @@
#include "nvctassert.h"
#include "vgpu/vgpu_guest_pma_scrubber.h"
#if !defined(SRT_BUILD)
#include "gpu/mem_mgr/ce_utils.h"
#endif
struct OBJGPU;
struct Heap;
struct OBJCHANNEL;
#define RM_SUBCHANNEL 0x0
#define MEMSET_PATTERN 0x00000000
#define SCRUBBER_NUM_PAYLOAD_SEMAPHORES (2)
#define SCRUBBER_SEMAPHORE_SIZE_INBYTES (4)
#define SCRUBBER_CHANNEL_SEMAPHORE_SIZE (SCRUBBER_SEMAPHORE_SIZE_INBYTES *\
#define SCRUBBER_CHANNEL_SEMAPHORE_SIZE (SCRUBBER_SEMAPHORE_SIZE_INBYTES * \
SCRUBBER_NUM_PAYLOAD_SEMAPHORES)
#define SCRUBBER_CHANNEL_NOTIFIER_SIZE (sizeof(NvNotification) * NV_CHANNELGPFIFO_NOTIFICATION_TYPE__SIZE_1)
@@ -52,67 +54,6 @@ struct OBJCHANNEL;
#define SCRUB_MAX_BYTES_PER_LINE 0xffffffffULL
#define MAX_SCRUB_ITEMS 4096 // 4K scrub items
#define READ_SCRUBBER_PAYLOAD_SEMA(channel) MEM_RD32((NvU8*)channel->pbCpuVA +\
channel->finishPayloadOffset)
#define READ_SCRUBBER_PB_SEMA(channel) MEM_RD32((NvU8*)channel->pbCpuVA +\
channel->semaOffset)
#define WRITE_SCRUBBER_PB_SEMA(channel, val) MEM_WR32((NvU8*)channel->pbCpuVA +\
channel->semaOffset, val);
#define WRITE_SCRUBBER_PAYLOAD_SEMA(channel,val) MEM_WR32((NvU8*)channel->pbCpuVA +\
channel->finishPayloadOffset, val);
// Use Incrementing Methods to save the PB Space
#define _NV_ASSERT_CONTIGUOUS_METHODS(a1, a2) NV_ASSERT((a2) - (a1) == 4)
#define NV_PUSH_METHOD(OpType, SubCh, Method, Count) \
(DRF_DEF(906F, _DMA, _SEC_OP, OpType) |\
DRF_NUM(906F, _DMA, _METHOD_ADDRESS, (Method) >> 2) |\
DRF_NUM(906F, _DMA, _METHOD_SUBCHANNEL, (SubCh)) |\
DRF_NUM(906F, _DMA, _METHOD_COUNT, (Count)))
#define NV_PUSH_DATA(Data) MEM_WR32(pPtr++, (Data))
#define _NV_PUSH_INC_1U(SubCh, a1,d1, Count) \
do{ \
NV_PUSH_DATA(NV_PUSH_METHOD(_INC_METHOD, SubCh, a1, Count));\
NV_PUSH_DATA(d1); \
} while(0)
#define NV_PUSH_INC_1U(SubCh, a1,d1) \
do{ \
_NV_PUSH_INC_1U (SubCh, a1,d1, 1);\
} while(0)
#define NV_PUSH_INC_2U(SubCh, a1,d1, a2,d2) \
do{ \
_NV_ASSERT_CONTIGUOUS_METHODS(a1, a2);\
_NV_PUSH_INC_1U(SubCh, a1,d1, 2); \
NV_PUSH_DATA(d2); \
} while(0)
#define NV_PUSH_INC_3U(SubCh, a1,d1, a2,d2, a3,d3) \
do{ \
_NV_ASSERT_CONTIGUOUS_METHODS(a1,a2);\
_NV_ASSERT_CONTIGUOUS_METHODS(a2,a3);\
_NV_PUSH_INC_1U(SubCh, a1,d1, 3); \
NV_PUSH_DATA(d2); \
NV_PUSH_DATA(d3); \
} while(0)
#define NV_PUSH_INC_4U(SubCh, a1,d1, a2,d2, a3,d3, a4,d4) \
do{ \
_NV_ASSERT_CONTIGUOUS_METHODS(a1,a2);\
_NV_ASSERT_CONTIGUOUS_METHODS(a2,a3);\
_NV_ASSERT_CONTIGUOUS_METHODS(a3,a4);\
_NV_PUSH_INC_1U(SubCh, a1,d1, 4); \
NV_PUSH_DATA(d2); \
NV_PUSH_DATA(d3); \
NV_PUSH_DATA(d4); \
} while(0)
// Structure to store the details of a scrubbing work item
typedef struct SCRUB_NODE {
// The 64 bit ID assigned to each work
@@ -144,8 +85,10 @@ typedef struct OBJMEMSCRUB {
NvLength scrubListSize;
// Pre-allocated Free Scrub List
PSCRUB_NODE pScrubList;
// Scrubber Channel
struct OBJCHANNEL *pChannel;
#if !defined(SRT_BUILD)
// Scrubber uses ceUtils to manage CE channel
CeUtils ceUtilsObject;
#endif
struct OBJGPU *pGpu;
VGPU_GUEST_PMA_SCRUB_BUFFER_RING vgpuScrubBuffRing;
NvBool bVgpuScrubberEnabled;

View File

@@ -26,12 +26,12 @@
#include "core/prelude.h"
#define CLEAR_HAL_ATTR(a) \
#define CLEAR_HAL_ATTR(a) \
a = (a &~(DRF_NUM(OS32, _ATTR, _COMPR, 0x3) | \
DRF_NUM(OS32, _ATTR, _TILED, 0x3) | \
DRF_NUM(OS32, _ATTR, _ZCULL, 0x3)));
#define CLEAR_HAL_ATTR2(a) \
#define CLEAR_HAL_ATTR2(a) \
a = (a & ~(DRF_SHIFTMASK(NVOS32_ATTR2_ZBC) | \
DRF_SHIFTMASK(NVOS32_ATTR2_GPU_CACHEABLE)));

View File

@@ -127,12 +127,12 @@ void pmaAddrtreeSetEvictingFrames(void *pMap, NvU64 frameEvictionsInProcess);
*/
NV_STATUS pmaAddrtreeScanContiguous(
void *pMap, NvU64 addrBase, NvU64 rangeStart, NvU64 rangeEnd,
NvU64 numPages, NvU64 *freelist, NvU32 pageSize, NvU64 alignment,
NvU64 numPages, NvU64 *freelist, NvU64 pageSize, NvU64 alignment,
NvU64 *pagesAllocated, NvBool bSkipEvict, NvBool bReverseAlloc);
NV_STATUS pmaAddrtreeScanDiscontiguous(
void *pMap, NvU64 addrBase, NvU64 rangeStart, NvU64 rangeEnd,
NvU64 numPages, NvU64 *freelist, NvU32 pageSize, NvU64 alignment,
NvU64 numPages, NvU64 *freelist, NvU64 pageSize, NvU64 alignment,
NvU64 *pagesAllocated, NvBool bSkipEvict, NvBool bReverseAlloc);
void pmaAddrtreePrintTree(void *pMap, const char* str);
@@ -154,7 +154,7 @@ void pmaAddrtreePrintTree(void *pMap, const char* str);
void pmaAddrtreeChangeState(void *pMap, NvU64 frameNum, PMA_PAGESTATUS newState);
void pmaAddrtreeChangeStateAttrib(void *pMap, NvU64 frameNum, PMA_PAGESTATUS newState, NvBool writeAttrib);
void pmaAddrtreeChangeStateAttribEx(void *pMap, NvU64 frameNum, PMA_PAGESTATUS newState,PMA_PAGESTATUS newStateMask);
void pmaAddrtreeChangePageStateAttrib(void * pMap, NvU64 startFrame, NvU32 pageSize,
void pmaAddrtreeChangePageStateAttrib(void * pMap, NvU64 startFrame, NvU64 pageSize,
PMA_PAGESTATUS newState, NvBool writeAttrib);
/*!

View File

@@ -90,7 +90,7 @@ typedef NvU32 PMA_PAGESTATUS;
#define ATTRIB_PERSISTENT NVBIT(MAP_IDX_PERSISTENT)
#define ATTRIB_NUMA_REUSE NVBIT(MAP_IDX_NUMA_REUSE)
#define ATTRIB_BLACKLIST NVBIT(MAP_IDX_BLACKLIST)
#define ATTRIB_MASK (ATTRIB_EVICTING | ATTRIB_SCRUBBING \
#define ATTRIB_MASK (ATTRIB_EVICTING | ATTRIB_SCRUBBING \
| ATTRIB_PERSISTENT | ATTRIB_NUMA_REUSE \
| ATTRIB_BLACKLIST)
@@ -114,6 +114,9 @@ typedef struct _PMA_STATS
NvU64 numFreeFrames; // PMA-wide free 64KB frame count
NvU64 numFree2mbPages; // PMA-wide free 2MB pages count
#if !defined(NVWATCH)
NvU64 num2mbPagesProtected; // PMA-wide total number of 2MB pages in protected memory
NvU64 numFreeFramesProtected; // PMA-wide free 64KB frame count in protected memory
NvU64 numFree2mbPagesProtected; // PMA-wide free 2MB pages count in protected memory
#endif // !defined(NVWATCH)
} PMA_STATS;

View File

@@ -59,7 +59,7 @@ extern "C" {
* is used for allocations coming from the Linux kernel.
* The perf implication is under further study. See bug #1999793.
*/
NV_STATUS pmaNumaAllocate(PMA *pPma, NvLength allocationCount, NvU32 pageSize,
NV_STATUS pmaNumaAllocate(PMA *pPma, NvLength allocationCount, NvU64 pageSize,
PMA_ALLOCATION_OPTIONS *allocationOptions, NvU64 *pPages);
/*!

View File

@@ -1,5 +1,5 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2015-2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-FileCopyrightText: Copyright (c) 2015-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
@@ -73,6 +73,7 @@ typedef struct SCRUB_NODE SCRUB_NODE;
#define PMA_INIT_INTERNAL NVBIT(3) // Used after heap is removed
#define PMA_INIT_FORCE_PERSISTENCE NVBIT(4)
#define PMA_INIT_ADDRTREE NVBIT(5)
#define PMA_INIT_NUMA_AUTO_ONLINE NVBIT(6)
// These flags are used for querying PMA's config and/or state.
#define PMA_QUERY_SCRUB_ENABLED NVBIT(0)
@@ -166,7 +167,7 @@ typedef enum
/*!
* @brief Callbacks to UVM for eviction
*/
typedef NV_STATUS (*pmaEvictPagesCb_t)(void *ctxPtr, NvU32 pageSize, NvU64 *pPages,
typedef NV_STATUS (*pmaEvictPagesCb_t)(void *ctxPtr, NvU64 pageSize, NvU64 *pPages,
NvU32 count, NvU64 physBegin, NvU64 physEnd,
MEMORY_PROTECTION prot);
typedef NV_STATUS (*pmaEvictRangeCb_t)(void *ctxPtr, NvU64 physBegin, NvU64 physEnd,
@@ -180,13 +181,13 @@ typedef void (*pmaMapDestroy_t)(void *pMap);
typedef void (*pmaMapChangeState_t)(void *pMap, NvU64 frameNum, PMA_PAGESTATUS newState);
typedef void (*pmaMapChangeStateAttrib_t)(void *pMap, NvU64 frameNum, PMA_PAGESTATUS newState, NvBool writeAttrib);
typedef void (*pmaMapChangeStateAttribEx_t)(void *pMap, NvU64 frameNum, PMA_PAGESTATUS newState, PMA_PAGESTATUS newStateMask);
typedef void (*pmaMapChangePageStateAttrib_t)(void *pMap, NvU64 startFrame, NvU32 pageSize, PMA_PAGESTATUS newState, NvBool writeAttrib);
typedef void (*pmaMapChangePageStateAttrib_t)(void *pMap, NvU64 startFrame, NvU64 pageSize, PMA_PAGESTATUS newState, NvBool writeAttrib);
typedef PMA_PAGESTATUS (*pmaMapRead_t)(void *pMap, NvU64 frameNum, NvBool readAttrib);
typedef NV_STATUS (*pmaMapScanContiguous_t)(void *pMap, NvU64 addrBase, NvU64 rangeStart, NvU64 rangeEnd,
NvU64 numPages, NvU64 *freelist, NvU32 pageSize, NvU64 alignment,
NvU64 numPages, NvU64 *freelist, NvU64 pageSize, NvU64 alignment,
NvU64 *pagesAllocated, NvBool bSkipEvict, NvBool bReverseAlloc);
typedef NV_STATUS (*pmaMapScanDiscontiguous_t)(void *pMap, NvU64 addrBase, NvU64 rangeStart, NvU64 rangeEnd,
NvU64 numPages, NvU64 *freelist, NvU32 pageSize, NvU64 alignment,
NvU64 numPages, NvU64 *freelist, NvU64 pageSize, NvU64 alignment,
NvU64 *pagesAllocated, NvBool bSkipEvict, NvBool bReverseAlloc);
typedef void (*pmaMapGetSize_t)(void *pMap, NvU64 *pBytesTotal);
typedef void (*pmaMapGetLargestFree_t)(void *pMap, NvU64 *pLargestFree);
@@ -251,6 +252,7 @@ struct _PMA
NvU64 coherentCpuFbBase; // Used to calculate FB offset from bus address
NvU64 coherentCpuFbSize; // Used for error checking only
NvU32 numaReclaimSkipThreshold; // percent value below which __GFP_RECLAIM will not be used.
NvBool bNumaAutoOnline; // If NUMA memory is auto-onlined
// Blacklist related states
PMA_BLACKLIST_CHUNK *pBlacklistChunks; // Tracking for blacklist pages
@@ -433,12 +435,12 @@ NV_STATUS pmaRegisterRegion(PMA *pPma, NvU32 id, NvBool bAsyncEccScrub,
* code,because it is not very informative.
*
*/
NV_STATUS pmaAllocatePages(PMA *pPma, NvLength pageCount, NvU32 pageSize,
NV_STATUS pmaAllocatePages(PMA *pPma, NvLength pageCount, NvU64 pageSize,
PMA_ALLOCATION_OPTIONS *pAllocationOptions, NvU64 *pPages);
// allocate on multiple GPU, thus pmaCount
NV_STATUS pmaAllocatePagesBroadcast(PMA **pPma, NvU32 pmaCount, NvLength allocationCount,
NvU32 pageSize, PMA_ALLOCATION_OPTIONS *pAllocationOptions, NvU64 *pPages);
NvU64 pageSize, PMA_ALLOCATION_OPTIONS *pAllocationOptions, NvU64 *pPages);
/*!
@@ -472,7 +474,7 @@ NV_STATUS pmaAllocatePagesBroadcast(PMA **pPma, NvU32 pmaCount, NvLength allocat
* TODO some error for rollback
*
*/
NV_STATUS pmaPinPages(PMA *pPma, NvU64 *pPages, NvLength pageCount, NvU32 pageSize);
NV_STATUS pmaPinPages(PMA *pPma, NvU64 *pPages, NvLength pageCount, NvU64 pageSize);
/*!
@@ -498,7 +500,7 @@ NV_STATUS pmaPinPages(PMA *pPma, NvU64 *pPages, NvLength pageCount, NvU32 pageSi
* TODO some error for rollback
*
*/
NV_STATUS pmaUnpinPages(PMA *pPma, NvU64 *pPages, NvLength pageCount, NvU32 pageSize);
NV_STATUS pmaUnpinPages(PMA *pPma, NvU64 *pPages, NvLength pageCount, NvU64 pageSize);
/*!
@@ -815,7 +817,7 @@ void pmaNumaOfflined(PMA *pPma);
* @return
* void
*/
void pmaGetClientBlacklistedPages(PMA *pPma, NvU64 *pChunks, NvU32 *pPageSize, NvU32 *pNumChunks);
void pmaGetClientBlacklistedPages(PMA *pPma, NvU64 *pChunks, NvU64 *pPageSize, NvU32 *pNumChunks);
/*!
* @brief Returns the PMA blacklist size in bytes for
@@ -865,6 +867,54 @@ void pmaPrintMapState(PMA *pPma);
*/
NV_STATUS pmaAddToBlacklistTracking(PMA *pPma, NvU64 physBase);
/*!
* @brief Returns total protected video memory.
*
* @param[in] pPma PMA pointer
* @param[in] pBytesTotal Pointer that will return the total FB memory size.
*
* @return
* void
*/
void pmaGetTotalProtectedMemory(PMA *pPma, NvU64 *pBytesTotal);
/*!
* @brief Returns total unprotected video memory.
*
* @param[in] pPma PMA pointer
* @param[in] pBytesTotal Pointer that will return the total FB memory size.
*
* @return
* void
*/
void pmaGetTotalUnprotectedMemory(PMA *pPma, NvU64 *pBytesTotal);
/*!
* @brief Returns information about the total free protected FB memory.
* In confidential compute use cases, memory will be split into
* protected and unprotected regions
*
* @param[in] pPma PMA pointer
* @param[in] pBytesFree Pointer that will return the free protected memory size.
*
* @return
* void
*/
void pmaGetFreeProtectedMemory(PMA *pPma, NvU64 *pBytesFree);
/*!
* @brief Returns information about the total free unprotected FB memory.
* In confidential compute use cases, memory will be split into
* protected and unprotected regions
*
* @param[in] pPma PMA pointer
* @param[in] pBytesFree Pointer that will return the free unprotected memory size.
*
* @return
* void
*/
void pmaGetFreeUnprotectedMemory(PMA *pPma, NvU64 *pBytesFree);
#ifdef __cplusplus
}
#endif
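
With pageSize widened from NvU32 to NvU64 across these entry points, callers can pass the 64-bit page-size constants from rm_page_size.h directly; a hedged sketch with default allocation options (whether zeroed options are sufficient depends on the caller):

// Sketch: allocate and pin four 2MB pages using the widened NvU64 pageSize.
static NV_STATUS pmaHugePageSketch(PMA *pPma)
{
    NvU64 pages[4];
    PMA_ALLOCATION_OPTIONS opts = {0};  // assumed: defaults acceptable for a sketch
    NV_STATUS status = pmaAllocatePages(pPma, 4, RM_PAGE_SIZE_HUGE, &opts, pages);
    if (status == NV_OK)
        status = pmaPinPages(pPma, pages, 4, RM_PAGE_SIZE_HUGE);  // same NvU64 width
    return status;
}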

View File

@@ -45,11 +45,11 @@ NvBool pmaStateCheck(PMA *pPma);
NV_STATUS _pmaEvictContiguous(PMA *pPma, void *pMap, NvU64 evictStart, NvU64 evictEnd,
MEMORY_PROTECTION prot);
NV_STATUS _pmaEvictPages(PMA *pPma, void *pMap, NvU64 *evictPages, NvU64 evictPageCount,
NvU64 *allocPages, NvU64 allocPageCount, NvU32 pageSize,
NvU64 *allocPages, NvU64 allocPageCount, NvU64 pageSize,
NvU64 physBegin, NvU64 physEnd, MEMORY_PROTECTION prot);
void _pmaClearScrubBit(PMA *pPma, SCRUB_NODE *pPmaScrubList, NvU64 count);
NV_STATUS _pmaCheckScrubbedPages(PMA *pPma, NvU64 chunkSize, NvU64 *pPages, NvU32 pageCount);
NV_STATUS _pmaPredictOutOfMemory(PMA *pPma, NvLength allocationCount, NvU32 pageSize,
NV_STATUS _pmaPredictOutOfMemory(PMA *pPma, NvLength allocationCount, NvU64 pageSize,
PMA_ALLOCATION_OPTIONS *allocationOptions);
NV_STATUS pmaSelector(PMA *pPma, PMA_ALLOCATION_OPTIONS *allocationOptions, NvS32 *regionList);
void _pmaReallocBlacklistPages (PMA *pPma, NvU32 regId, NvU64 rangeBegin, NvU64 rangeSize);

View File

@@ -131,7 +131,7 @@ void pmaRegmapChangeStateAttrib(void *pMap, NvU64 frameNum,
*
* @return void
*/
void pmaRegmapChangePageStateAttrib(void * pMap, NvU64 frameNumStart, NvU32 pageSize,
void pmaRegmapChangePageStateAttrib(void * pMap, NvU64 frameNumStart, NvU64 pageSize,
PMA_PAGESTATUS newState, NvBool writeAttrib);
/*!
@@ -188,7 +188,7 @@ PMA_PAGESTATUS pmaRegmapRead(void *pMap, NvU64 frameNum, NvBool readAttrib);
*/
NV_STATUS pmaRegmapScanContiguous(
void *pMap, NvU64 addrBase, NvU64 rangeStart, NvU64 rangeEnd,
NvU64 numPages, NvU64 *freelist, NvU32 pageSize, NvU64 alignment,
NvU64 numPages, NvU64 *freelist, NvU64 pageSize, NvU64 alignment,
NvU64 *pagesAllocated, NvBool bSkipEvict, NvBool bReverseAlloc);
/*!
@@ -215,7 +215,7 @@ NV_STATUS pmaRegmapScanContiguous(
*/
NV_STATUS pmaRegmapScanDiscontiguous(
void *pMap, NvU64 addrBase, NvU64 rangeStart, NvU64 rangeEnd,
NvU64 numPages, NvU64 *freelist, NvU32 pageSize, NvU64 alignment,
NvU64 numPages, NvU64 *freelist, NvU64 pageSize, NvU64 alignment,
NvU64 *pagesAllocated, NvBool bSkipEvict, NvBool bReverseAlloc);
/*!

View File

@@ -0,0 +1,80 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 1993-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef RM_PAGE_SIZE_H
#define RM_PAGE_SIZE_H
//---------------------------------------------------------------------------
//
// Memory page defines.
//
// These correspond to the granularity understood by the hardware
// for address mapping; the system page size can be larger.
//
//---------------------------------------------------------------------------
#define RM_PAGE_SIZE_INVALID 0
#define RM_PAGE_SIZE 4096
#define RM_PAGE_SIZE_64K (64 * 1024)
#define RM_PAGE_SIZE_128K (128 * 1024)
#define RM_PAGE_MASK 0x0FFF
#define RM_PAGE_SHIFT 12
#define RM_PAGE_SHIFT_64K 16
#define RM_PAGE_SHIFT_128K 17
#define RM_PAGE_SHIFT_2M 21
#define RM_PAGE_SIZE_2M (1 << RM_PAGE_SHIFT_2M)
// Huge page size is 2 MB
#define RM_PAGE_SHIFT_HUGE RM_PAGE_SHIFT_2M
#define RM_PAGE_SIZE_HUGE (1ULL << RM_PAGE_SHIFT_HUGE)
#define RM_PAGE_MASK_HUGE ((1ULL << RM_PAGE_SHIFT_HUGE) - 1)
// 512MB page size
#define RM_PAGE_SHIFT_512M 29
#define RM_PAGE_SIZE_512M (1ULL << RM_PAGE_SHIFT_512M)
#define RM_PAGE_MASK_512M (RM_PAGE_SIZE_512M - 1)
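//
// Illustrative sketch (not part of the original header): the shift and
// mask macros above are typically used to round addresses or sizes to a
// page boundary. RM_PAGE_ALIGN_UP_SKETCH is a hypothetical name.
//
#define RM_PAGE_ALIGN_UP_SKETCH(size, pageShift) \
    ((((NvU64)(size)) + ((1ULL << (pageShift)) - 1)) & ~((1ULL << (pageShift)) - 1))
//
// For example:
//   RM_PAGE_ALIGN_UP_SKETCH(0x1234, RM_PAGE_SHIFT)    == 0x2000
//   RM_PAGE_ALIGN_UP_SKETCH(0x1234, RM_PAGE_SHIFT_2M) == RM_PAGE_SIZE_2M
//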
//---------------------------------------------------------------------------
//
// Memory page attributes.
//
// These attributes are used by software for page size mapping.
// Big pages can be 64KB or 128KB [Fermi/Kepler/Pascal].
// Huge pages are 2MB [Pascal+].
// 512MB pages are supported on Ampere+.
// The default page attribute lets the driver decide the optimal page size.
//
//---------------------------------------------------------------------------
typedef enum
{
RM_ATTR_PAGE_SIZE_DEFAULT,
RM_ATTR_PAGE_SIZE_4KB,
RM_ATTR_PAGE_SIZE_BIG,
RM_ATTR_PAGE_SIZE_HUGE,
RM_ATTR_PAGE_SIZE_512MB,
RM_ATTR_PAGE_SIZE_INVALID
}
RM_ATTR_PAGE_SIZE;
#endif // RM_PAGE_SIZE_H
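
A minimal sketch of how the attribute enum maps back to concrete sizes, assuming a 64KB big-page size (the real value is architecture-dependent, per the comment above); rmAttrToPageSizeSketch is a hypothetical helper, not an RM API:

// Hypothetical helper: map RM_ATTR_PAGE_SIZE to a byte count.
// The big-page size is assumed to be 64KB here; real code queries the
// GPU, and RM_PAGE_SIZE_128K applies on some architectures.
static NvU64 rmAttrToPageSizeSketch(RM_ATTR_PAGE_SIZE attr)
{
    switch (attr)
    {
        case RM_ATTR_PAGE_SIZE_4KB:   return RM_PAGE_SIZE;
        case RM_ATTR_PAGE_SIZE_BIG:   return RM_PAGE_SIZE_64K;
        case RM_ATTR_PAGE_SIZE_HUGE:  return RM_PAGE_SIZE_HUGE;
        case RM_ATTR_PAGE_SIZE_512MB: return RM_PAGE_SIZE_512M;
        default:                      return RM_PAGE_SIZE_INVALID; // DEFAULT: driver decides
    }
}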

View File

@@ -0,0 +1,3 @@
#include "g_sem_surf_nvoc.h"

View File

@@ -1,5 +1,5 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 1993-2021 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-FileCopyrightText: Copyright (c) 1993-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
@@ -33,60 +33,14 @@
#include "nvtypes.h"
#include "nvgputypes.h"
#include "nvstatus.h"
#include "resserv/rs_client.h"
#include "gpu/mem_mgr/rm_page_size.h"
typedef struct OBJGPU OBJGPU;
typedef struct ChannelDescendant ChannelDescendant;
typedef struct ContextDma ContextDma;
typedef struct Memory Memory;
typedef struct EVENTNOTIFICATION EVENTNOTIFICATION;
//---------------------------------------------------------------------------
//
// Memory page defines.
//
// These correspond to the granularity understood by the hardware
// for address mapping; the system page size can be larger.
//
//---------------------------------------------------------------------------
#define RM_PAGE_SIZE_INVALID 0
#define RM_PAGE_SIZE 4096
#define RM_PAGE_SIZE_64K (64 * 1024)
#define RM_PAGE_SIZE_128K (128 * 1024)
#define RM_PAGE_MASK 0x0FFF
#define RM_PAGE_SHIFT 12
#define RM_PAGE_SHIFT_64K 16
#define RM_PAGE_SHIFT_128K 17
// Huge page size is 2 MB
#define RM_PAGE_SHIFT_HUGE 21
#define RM_PAGE_SIZE_HUGE (1 << RM_PAGE_SHIFT_HUGE)
#define RM_PAGE_MASK_HUGE ((1 << RM_PAGE_SHIFT_HUGE) - 1)
// 512MB page size
#define RM_PAGE_SHIFT_512M 29
#define RM_PAGE_SIZE_512M (1 << RM_PAGE_SHIFT_512M)
#define RM_PAGE_MASK_512M (RM_PAGE_SIZE_512M - 1)
//---------------------------------------------------------------------------
//
// Memory page attributes.
//
// These attributes are used by software for page size mapping;
// Big pages can be of 64/128KB[Fermi/Kepler/Pascal]
// Huge page is 2 MB[Pascal+]
// 512MB page is Ampere+
// Default page attribute lets driver decide the optimal page size
//
//---------------------------------------------------------------------------
typedef enum
{
RM_ATTR_PAGE_SIZE_DEFAULT = 0x0,
RM_ATTR_PAGE_SIZE_4KB = 0x1,
RM_ATTR_PAGE_SIZE_BIG = 0x2,
RM_ATTR_PAGE_SIZE_HUGE = 0x3,
RM_ATTR_PAGE_SIZE_512MB = 0x4,
RM_ATTR_PAGE_SIZE_INVALID = 0x5
}
RM_ATTR_PAGE_SIZE;
//---------------------------------------------------------------------------
//
@@ -133,8 +87,8 @@ void notifyFillNOTIFICATION(OBJGPU *pGpu,
NV_STATUS CompletionStatus,
NvBool TimeSupplied,
NvU64 Time);
NV_STATUS notifyFillNotifierGPUVA (OBJGPU*, NvHandle, NvHandle, NvU64, NvV32, NvV16, NV_STATUS, NvU32);
NV_STATUS notifyFillNotifierGPUVATimestamp (OBJGPU*, NvHandle, NvHandle, NvU64, NvV32, NvV16, NV_STATUS, NvU32, NvU64);
NV_STATUS notifyFillNotifierGPUVA (OBJGPU*, RsClient*, NvHandle, NvU64, NvV32, NvV16, NV_STATUS, NvU32);
NV_STATUS notifyFillNotifierGPUVATimestamp (OBJGPU*, RsClient*, NvHandle, NvU64, NvV32, NvV16, NV_STATUS, NvU32, NvU64);
NV_STATUS notifyFillNotifierMemory (OBJGPU*, Memory *, NvV32, NvV16, NV_STATUS, NvU32);
NV_STATUS notifyFillNotifierMemoryTimestamp(OBJGPU*, Memory *, NvV32, NvV16, NV_STATUS, NvU32, NvU64);
void notifyFillNvNotification(OBJGPU *pGpu,
@@ -145,8 +99,8 @@ void notifyFillNvNotification(OBJGPU *pGpu,
NvBool TimeSupplied,
NvU64 Time);
NV_STATUS semaphoreFillGPUVA (OBJGPU*, NvHandle, NvHandle, NvU64, NvV32, NvV32, NvBool);
NV_STATUS semaphoreFillGPUVATimestamp(OBJGPU*, NvHandle, NvHandle, NvU64, NvV32, NvV32, NvBool, NvU64);
NV_STATUS semaphoreFillGPUVA (OBJGPU*, RsClient*, NvHandle, NvU64, NvV32, NvV32, NvBool);
NV_STATUS semaphoreFillGPUVATimestamp(OBJGPU*, RsClient*, NvHandle, NvU64, NvV32, NvV32, NvBool, NvU64);
RM_ATTR_PAGE_SIZE dmaNvos32ToPageSizeAttr(NvU32 attr, NvU32 attr2);

View File

@@ -67,7 +67,7 @@ typedef struct
NvU32 flags;
/*!
 * Specifies the number of clients that have requested
 * CUDA boost. This is used only for CUDA clients.
*/
NvU32 refCount;

View File

@@ -50,7 +50,7 @@ struct KERNEL_PERF_GPU_BOOST_SYNC
*/
NvBool bHystersisEnable;
/*!
* SLI GPU Boost feature is enabled.
*/
NvBool bSliGpuBoostSyncEnable;

View File

@@ -0,0 +1,3 @@
#include "g_sec2_context_nvoc.h"

View File

@@ -0,0 +1,74 @@
/*
* SPDX-FileCopyrightText: Copyright (c) 2021-2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#ifndef LIBSPDM_INCLUDES_H
#define LIBSPDM_INCLUDES_H
//
// Dedicated header file to centralize all libspdm-related includes and defines.
// This allows us to minimize the number of headers (and sources) that have a
// direct libspdm dependency, while allowing shared macros & types for
// dependent sources.
//
/* ------------------------ Includes --------------------------------------- */
#include "internal/libspdm_common_lib.h"
#include "internal/libspdm_secured_message_lib.h"
#include "library/spdm_requester_lib.h"
/* ------------------------ Macros and Defines ----------------------------- */
//
// As libspdm has its own RETURN_STATUS define, we need to ensure we do not
// accidentally compare it against NV_STATUS. Use this macro for consistent
// libspdm error handling.
//
#define CHECK_SPDM_STATUS(expr) do { \
libspdm_return_t __spdmStatus; \
__spdmStatus = (expr); \
if (LIBSPDM_STATUS_IS_ERROR(__spdmStatus)) \
{ \
NV_PRINTF(LEVEL_INFO, "SPDM failed with status 0x%0x\n", \
__spdmStatus); \
status = NV_ERR_GENERIC; \
goto ErrorExit; \
} \
} while (NV_FALSE)
// Check for any critical issues caused by data size mismatches.
ct_assert(sizeof(NvU8) == sizeof(uint8_t));
ct_assert(sizeof(NvU16) == sizeof(uint16_t));
ct_assert(sizeof(NvU32) == sizeof(uint32_t));
ct_assert(sizeof(NvU64) == sizeof(uint64_t));
typedef struct _SPDM_ALGO_CHECK_ENTRY
{
libspdm_data_type_t dataType;
uint32_t expectedAlgo;
} SPDM_ALGO_CHECK_ENTRY, *PSPDM_ALGO_CHECK_ENTRY;
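//
// Illustrative sketch (not part of the original header): a check table
// built from this type. The two constants are believed to come from
// libspdm's data-type enum and the SPDM spec header, respectively; treat
// them as examples rather than values mandated by this header.
//
static const SPDM_ALGO_CHECK_ENTRY g_exampleAlgoCheckTable[] =
{
    { LIBSPDM_DATA_MEASUREMENT_HASH_ALGO,
      SPDM_ALGORITHMS_MEASUREMENT_HASH_ALGO_TPM_ALG_SHA_384 },
};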
//
// Check for an assert in libspdm code, indicating a fatal condition.
// Returns false if an assert was hit.
//
bool nvspdm_check_and_clear_libspdm_assert(void);
#endif // LIBSPDM_INCLUDES_H
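
A minimal usage sketch for CHECK_SPDM_STATUS, assuming libspdm's libspdm_init_connection requester entry point; the macro's expansion assigns to a local named status and jumps to an ErrorExit label, so the caller must provide both:

// Hypothetical caller, illustrating the status/ErrorExit contract.
static NV_STATUS spdmEstablishSessionSketch(void *pSpdmContext)
{
    NV_STATUS status = NV_OK;

    // On a libspdm error this logs, sets status, and jumps to ErrorExit.
    CHECK_SPDM_STATUS(libspdm_init_connection(pSpdmContext, false));

ErrorExit:
    return status;
}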

View File

@@ -0,0 +1,3 @@
#include "g_spdm_nvoc.h"

View File

@@ -51,24 +51,24 @@
NV_STATUS subdeviceCtrlCmdRcSetCleanErrorHistory(Subdevice *pSubdevice);
RMCTRL_EXPORT(NV2080_CTRL_CMD_RC_GET_WATCHDOG_INFO,
RMCTRL_FLAGS(NON_PRIVILEGED))
RMCTRL_FLAGS(NON_PRIVILEGED, GPU_LOCK_DEVICE_ONLY, API_LOCK_READONLY))
NV_STATUS subdeviceCtrlCmdRcGetWatchdogInfo(Subdevice *pSubdevice,
NV2080_CTRL_RC_GET_WATCHDOG_INFO_PARAMS *pWatchdogInfoParams);
RMCTRL_EXPORT(NV2080_CTRL_CMD_RC_DISABLE_WATCHDOG,
RMCTRL_FLAGS(NON_PRIVILEGED))
RMCTRL_FLAGS(NON_PRIVILEGED, GPU_LOCK_DEVICE_ONLY))
NV_STATUS subdeviceCtrlCmdRcDisableWatchdog(Subdevice *pSubdevice);
RMCTRL_EXPORT(NV2080_CTRL_CMD_RC_SOFT_DISABLE_WATCHDOG,
RMCTRL_FLAGS(NON_PRIVILEGED))
RMCTRL_FLAGS(NON_PRIVILEGED, GPU_LOCK_DEVICE_ONLY))
NV_STATUS subdeviceCtrlCmdRcSoftDisableWatchdog(Subdevice *pSubdevice);
RMCTRL_EXPORT(NV2080_CTRL_CMD_RC_ENABLE_WATCHDOG,
RMCTRL_FLAGS(NON_PRIVILEGED))
RMCTRL_FLAGS(NON_PRIVILEGED, GPU_LOCK_DEVICE_ONLY))
NV_STATUS subdeviceCtrlCmdRcEnableWatchdog(Subdevice *pSubdevice);
RMCTRL_EXPORT(NV2080_CTRL_CMD_RC_RELEASE_WATCHDOG_REQUESTS,
RMCTRL_FLAGS(NON_PRIVILEGED))
RMCTRL_FLAGS(NON_PRIVILEGED, GPU_LOCK_DEVICE_ONLY))
NV_STATUS subdeviceCtrlCmdRcReleaseWatchdogRequests(Subdevice *pSubdevice);
RMCTRL_EXPORT(NV2080_CTRL_CMD_INTERNAL_RC_WATCHDOG_TIMEOUT,