doca-docs/gpunetio__dma__memcpy__sample_8c_source.html

 /*

  * Copyright (c) 2024 NVIDIA CORPORATION AND AFFILIATES.  All rights reserved.

  *

  * Redistribution and use in source and binary forms, with or without modification, are permitted

  * provided that the following conditions are met:

  *     * Redistributions of source code must retain the above copyright notice, this list of

  *       conditions and the following disclaimer.

  *     * Redistributions in binary form must reproduce the above copyright notice, this list of

  *       conditions and the following disclaimer in the documentation and/or other materials

  *       provided with the distribution.

  *     * Neither the name of the NVIDIA CORPORATION nor the names of its contributors may be used

  *       to endorse or promote products derived from this software without specific prior written

  *       permission.

  *

  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR

  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND

  * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE

  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,

  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;

  * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,

  * STRICT LIABILITY, OR TOR (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

  *

  */


 #include <unistd.h>

 #include <time.h>

 #include <stdbool.h>


 #include <doca_log.h>

 #include <doca_buf.h>

 #include <doca_buf_inventory.h>

 #include <doca_mmap.h>

 #include <doca_pe.h>


 #include "gpunetio_dma_common.h"


 #define SLEEP_IN_NANOS (10 * 1000)

 #define GPU_PAGE_SIZE (1UL << 16)

 #define NUM_TASKS 1

 #define NUM_BUFS 2

 #define DEFAULT_VALUE 0


 /* Global flag indicating the task status */

 static uint8_t is_task_done = 0;


 DOCA_LOG_REGISTER(GPU_DMA_MEMCPY::SAMPLE);


 /*

  * Sample objects

  */

 struct gpu_dma_sample_objects {

     struct program_core_objects core_objs;         /* Core objects */

     struct doca_dma *dma;                  /* DOCA DMA instance */

     struct doca_gpu_dma *dma_gpu;              /* DOCA DMA GPU instance */

     struct doca_gpu *gpu_dev;              /* DOCA GPU device */

     struct doca_buf *src_doca_buf;             /* src doca buffer - CPU memory */

     struct doca_buf *dst_doca_buf;             /* dst doca buffer - GPU memory */

     struct doca_buf_arr *src_doca_buf_arr;         /* src doca buffer - GPU memory */

     struct doca_buf_arr *dst_doca_buf_arr;         /* dst doca buffer - CPU memory */

     struct doca_gpu_buf_arr *src_doca_gpu_buf_arr; /* src GPU doca buffer - GPU memory */

     struct doca_gpu_buf_arr *dst_doca_gpu_buf_arr; /* dst GPU doca buffer - CPU memory */

     char *src_buffer;                  /* src buffer address - CPU memory */

     char *dst_buffer;                  /* dst buffer address - GPU memory */

     bool gpu_datapath;                 /* Enable GPU datapath */

 };


 /*

  * DMA memcpy task common callback

  *

  * @dma_task [in]: DMA task

  * @task_user_data [in]: Task user data

  * @ctx_user_data [in]: Context user data

  */

 static void memcpy_task_common_callback(struct doca_dma_task_memcpy *dma_task,

                     union doca_data task_user_data,

                     union doca_data ctx_user_data)

 {

     (void)dma_task;

     (void)task_user_data;

     (void)ctx_user_data;


     /* Set a flag to notify upon completion of a task */

     is_task_done = 1;

 }


 /*

  * Initialize DOCA device

  *

  * @nic_pcie_addr [in]: Network card PCIe address

  * @ddev [out]: DOCA device

  * @return: DOCA_SUCCESS on success and DOCA_ERROR otherwise

  */

 static doca_error_t init_doca_device(char *nic_pcie_addr, struct doca_dev **ddev)

 {

     doca_error_t status;


     if (nic_pcie_addr == NULL || ddev == NULL)

         return DOCA_ERROR_INVALID_VALUE;


     status = open_doca_device_with_pci(nic_pcie_addr, NULL, ddev);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Failed to open DOCA device based on NIC PCI address");

         return status;

     }


     return DOCA_SUCCESS;

 }


 /*

  * Initialize sample memory objects

  *

  * @state [in]: Sample objects

  * @return: DOCA_SUCCESS on success and DOCA_ERROR otherwise

  */

 static doca_error_t init_sample_mem_objs(struct gpu_dma_sample_objects *state)

 {

     doca_error_t status;

     char *tmp_cpu;


     if (state->gpu_datapath) {

         /* Allocate GPU src buffer */

         status = doca_gpu_mem_alloc(state->gpu_dev,

                         DMA_MEMCPY_SIZE,

                         GPU_PAGE_SIZE,

                         DOCA_GPU_MEM_TYPE_GPU_CPU, // GDRCopy

                         (void **)&state->src_buffer,

                         (void **)&tmp_cpu);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Failed to initialize memory objects: Unable to allocate gpu memory: %s",

                      doca_error_get_descr(status));

             return status;

         }


         /* Copy data to src buffer */

         strcpy(tmp_cpu, "This is a sample piece of text from GPU");


         DOCA_LOG_INFO("The GPU source buffer value to be copied to CPU memory: %s", tmp_cpu);


         status = doca_mmap_create(&state->core_objs.src_mmap);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to create source mmap: %s", doca_error_get_descr(status));

             return status;

         }

         status = doca_mmap_add_dev(state->core_objs.src_mmap, state->core_objs.dev);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to add device to source mmap: %s", doca_error_get_descr(status));

             return status;

         }


         /* Allocate CPU dst buffer */

         state->dst_buffer = (char *)malloc(DMA_MEMCPY_SIZE);

         if (state->dst_buffer == NULL) {

             DOCA_LOG_ERR("Failed to initialize memory objects: Unable to allocate cpu memory");

             return DOCA_ERROR_NO_MEMORY;

         }


         memset(state->dst_buffer, DEFAULT_VALUE, DMA_MEMCPY_SIZE);


         status = doca_mmap_create(&state->core_objs.dst_mmap);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to create destination mmap: %s", doca_error_get_descr(status));

             return status;

         }

         status = doca_mmap_add_dev(state->core_objs.dst_mmap, state->core_objs.dev);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to add device to destination mmap: %s", doca_error_get_descr(status));

             return status;

         }


     } else {

         /* Create DOCA Core objects */

         status = create_core_objects(&(state->core_objs), NUM_BUFS);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Failed to initialize memory objects: Failed to create core objects: %s",

                      doca_error_get_descr(status));

             return status;

         }


         /* Allocate CPU src buffer */

         state->src_buffer = (char *)malloc(DMA_MEMCPY_SIZE);

         if (state->src_buffer == NULL) {

             DOCA_LOG_ERR("Failed to initialize memory objects: Unable to allocate cpu memory");

             return DOCA_ERROR_NO_MEMORY;

         }


         /* Copy data to src buffer */

         strcpy(state->src_buffer, "This is a sample piece of text from CPU");


         /* Print the source buffer */

         DOCA_LOG_INFO("The CPU source buffer value to be copied to GPU memory: %s", state->src_buffer);


         /* Allocate GPU dst buffer */

         status = doca_gpu_mem_alloc(state->gpu_dev,

                         DMA_MEMCPY_SIZE,

                         GPU_PAGE_SIZE,

                         DOCA_GPU_MEM_TYPE_GPU,

                         (void **)&state->dst_buffer,

                         NULL);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Failed to initialize memory objects: Unable to allocate gpu memory: %s",

                      doca_error_get_descr(status));

             return status;

         }

     }


     /* Set memory range in dst mmap with GPU memory address */

     status = doca_mmap_set_memrange(state->core_objs.dst_mmap, state->dst_buffer, DMA_MEMCPY_SIZE);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Failed to initialize memory objects: Unable to set memrange to dst mmap: %s",

                  doca_error_get_descr(status));

         return status;

     }


     /* Set memory range in src mmap with CPU memory address */

     status = doca_mmap_set_memrange(state->core_objs.src_mmap, state->src_buffer, DMA_MEMCPY_SIZE);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Failed to initialize memory objects: Unable to set memrange to src mmap: %s",

                  doca_error_get_descr(status));

         return status;

     }


     /* Start src mmap */

     status = doca_mmap_start(state->core_objs.src_mmap);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Failed to initialize memory objects: Unable to start src mmap: %s",

                  doca_error_get_descr(status));

         return status;

     }


     /* Start dst mmap */

     status = doca_mmap_start(state->core_objs.dst_mmap);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Failed to initialize memory objects: Unable to start dst mmap: %s",

                  doca_error_get_descr(status));

         return status;

     }


     if (state->gpu_datapath) {

         /* Create src GPU buffer array */

         status = doca_buf_arr_create(1, &state->src_doca_buf_arr);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to start buf: doca src_doca_buf_arr internal error");

             return status;

         }


         status = doca_buf_arr_set_target_gpu(state->src_doca_buf_arr, state->gpu_dev);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to start buf: doca src_doca_buf_arr internal error");

             return status;

         }


         status =

             doca_buf_arr_set_params(state->src_doca_buf_arr, state->core_objs.src_mmap, DMA_MEMCPY_SIZE, 0);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to start buf: doca src_doca_buf_arr internal error");

             return status;

         }


         status = doca_buf_arr_start(state->src_doca_buf_arr);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to start buf: doca src_doca_buf_arr internal error");

             return status;

         }


         status = doca_buf_arr_get_gpu_handle(state->src_doca_buf_arr, &(state->src_doca_gpu_buf_arr));

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to get buff_arr GPU handle: %s", doca_error_get_descr(status));

             return status;

         }


         /* Create dst GPU buffer array */

         status = doca_buf_arr_create(1, &state->dst_doca_buf_arr);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to start buf: doca dst_doca_buf_arr internal error");

             return status;

         }


         status = doca_buf_arr_set_target_gpu(state->dst_doca_buf_arr, state->gpu_dev);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to start buf: doca dst_doca_buf_arr internal error");

             return status;

         }


         status =

             doca_buf_arr_set_params(state->dst_doca_buf_arr, state->core_objs.dst_mmap, DMA_MEMCPY_SIZE, 0);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to start buf: doca dst_doca_buf_arr internal error");

             return status;

         }


         status = doca_buf_arr_start(state->dst_doca_buf_arr);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to start buf: doca dst_doca_buf_arr internal error");

             return status;

         }


         status = doca_buf_arr_get_gpu_handle(state->dst_doca_buf_arr, &(state->dst_doca_gpu_buf_arr));

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Unable to get buff_arr GPU handle: %s", doca_error_get_descr(status));

             return status;

         }

     } else {

         /* Get a DOCA buffer from src mmap (CPU) */

         doca_buf_inventory_buf_get_by_data(state->core_objs.buf_inv,

                            state->core_objs.src_mmap,

                            state->src_buffer,

                            DMA_MEMCPY_SIZE,

                            &state->src_doca_buf);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR(

                 "Failed to initialize memory objects: Unable to acquire DOCA buffer representing src buffer: %s",

                 doca_error_get_descr(status));

             return status;

         }


         /* Get a DOCA buffer from dst mmap (GPU) */

         status = doca_buf_inventory_buf_get_by_addr(state->core_objs.buf_inv,

                                 state->core_objs.dst_mmap,

                                 state->dst_buffer,

                                 DMA_MEMCPY_SIZE,

                                 &state->dst_doca_buf);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR(

                 "Failed to initialize memory objects: Unable to acquire DOCA buffer representing dst buffer: %s",

                 doca_error_get_descr(status));

             return status;

         }

     }


     return DOCA_SUCCESS;

 }


 /*

  * Clean sample resources

  *

  * @state [in]: Sample objects to be destroyed

  */

 static void gpu_dma_cleanup(struct gpu_dma_sample_objects *state)

 {

     doca_error_t status;


     if (state->gpu_datapath) {

         DOCA_LOG_INFO("Cleanup DMA ctx with GPU data path");


         if (state->core_objs.ctx != NULL) {

             status = doca_ctx_stop(state->core_objs.ctx);

             if (status != DOCA_SUCCESS)

                 DOCA_LOG_ERR("Failed to clean sample objects: Failed to stop dma ctx: %s",

                          doca_error_get_descr(status));

         }


         if (state->dma != NULL) {

             status = doca_dma_destroy(state->dma);

             if (status != DOCA_SUCCESS)

                 DOCA_LOG_ERR("Failed to clean sample objects: Failed to destroy dma: %s",

                          doca_error_get_descr(status));

         }


         if (state->core_objs.src_mmap != NULL) {

             status = doca_mmap_destroy(state->core_objs.src_mmap);

             if (status != DOCA_SUCCESS)

                 DOCA_LOG_ERR("Failed to clean sample objects: Failed to destroy src_mmap: %s",

                          doca_error_get_descr(status));

         }


         if (state->core_objs.dst_mmap != NULL) {

             status = doca_mmap_destroy(state->core_objs.dst_mmap);

             if (status != DOCA_SUCCESS)

                 DOCA_LOG_ERR("Failed to clean sample objects: Failed to destroy dst_mmap: %s",

                          doca_error_get_descr(status));

         }


         if (state->dst_buffer != NULL) {

             free(state->dst_buffer);

             state->dst_buffer = NULL;

         }


         if (state->src_buffer != NULL) {

             doca_gpu_mem_free(state->gpu_dev, (void *)state->src_buffer);

             state->src_buffer = NULL;

         }

     } else {

         DOCA_LOG_INFO("Cleanup DMA ctx with CPU data path");

         if (state->core_objs.ctx != NULL) {

             status = doca_ctx_stop(state->core_objs.ctx);

             if (status != DOCA_SUCCESS)

                 DOCA_LOG_ERR("Failed to clean sample objects: Failed to stop dma ctx: %s",

                          doca_error_get_descr(status));

         }


         if (state->dma != NULL) {

             status = doca_dma_destroy(state->dma);

             if (status != DOCA_SUCCESS)

                 DOCA_LOG_ERR("Failed to clean sample objects: Failed to destroy dma: %s",

                          doca_error_get_descr(status));

         }


         if (state->dst_doca_buf != NULL) {

             status = doca_buf_dec_refcount(state->dst_doca_buf, NULL);

             if (status != DOCA_SUCCESS)

                 DOCA_LOG_ERR(

                     "Failed to clean sample objects: Failed to decrease DOCA dst buffer reference count: %s",

                     doca_error_get_descr(status));

         }


         if (state->src_doca_buf != NULL) {

             status = doca_buf_dec_refcount(state->src_doca_buf, NULL);

             if (status != DOCA_SUCCESS)

                 DOCA_LOG_ERR(

                     "Failed to clean sample objects: Failed to decrease DOCA src buffer reference count: %s",

                     doca_error_get_descr(status));

         }


         status = destroy_core_objects(&(state->core_objs));

         if (status != DOCA_SUCCESS)

             DOCA_LOG_ERR("Failed to clean sample objects: Failed to destroy core objects: %s",

                      doca_error_get_descr(status));


         if (state->dst_buffer != NULL) {

             doca_gpu_mem_free(state->gpu_dev, (void *)state->dst_buffer);

             state->dst_buffer = NULL;

         }


         if (state->src_buffer != NULL) {

             free(state->src_buffer);

             state->src_buffer = NULL;

         }


         if (state->gpu_dev != NULL) {

             status = doca_gpu_destroy(state->gpu_dev);

             if (status != DOCA_SUCCESS)

                 DOCA_LOG_ERR("Failed to clean sample objects: Failed to destroy doca gpu: %s",

                          doca_error_get_descr(status));

         }

     }

 }


 /*

  * Initialize dma context

  *

  * @state [in]: Sample objects

  * @return: DOCA_SUCCESS on success and DOCA_ERROR otherwise

  */

 static doca_error_t init_dma_ctx(struct gpu_dma_sample_objects *state)

 {

     doca_error_t status;


     /* Create dma ctx */

     status = doca_dma_create(state->core_objs.dev, &state->dma);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Failed to initialize dma ctx: Unable to create DMA engine: %s",

                  doca_error_get_descr(status));

         return status;

     }


     state->core_objs.ctx = doca_dma_as_ctx(state->dma);


     if (state->gpu_datapath) {

         status = doca_ctx_set_datapath_on_gpu(state->core_objs.ctx, state->gpu_dev);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Failed to set datapath on GPU: %s", doca_error_get_descr(status));

             return status;

         }

     } else {

         /* Connect context to progress engine */

         status = doca_pe_connect_ctx(state->core_objs.pe, state->core_objs.ctx);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Failed to initialize dma ctx: Failed to connect PE to DMA: %s",

                      doca_error_get_descr(status));

             return status;

         }


         status = doca_dma_task_memcpy_set_conf(state->dma,

                                memcpy_task_common_callback,

                                memcpy_task_common_callback,

                                NUM_TASKS);

         if (status != DOCA_SUCCESS) {

             DOCA_LOG_ERR("Failed to initialize dma ctx: Unable to config DMA task %s",

                      doca_error_get_descr(status));

             return status;

         }

     }


     /* Start doca ctx */

     status = doca_ctx_start(state->core_objs.ctx);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Failed to initialize dma ctx: Unable to start dma context: %s",

                  doca_error_get_descr(status));

         return status;

     }


     return DOCA_SUCCESS;

 }


 /*

  * Submit DMA Memcpy task

  *

  * @state [in]: Sample objects

  * @return: DOCA_SUCCESS on success and DOCA_ERROR otherwise

  */

 static doca_error_t submit_dma_memcpy_task(struct gpu_dma_sample_objects *state)

 {

     doca_error_t status;

     struct doca_dma_task_memcpy *memcpy_task;

     struct doca_task *task;

     union doca_data memcpy_task_user_data = {0};

     struct timespec ts = {

         .tv_sec = 0,

         .tv_nsec = SLEEP_IN_NANOS,

     };


     /* Construct DMA task */

     status = doca_dma_task_memcpy_alloc_init(state->dma,

                          state->src_doca_buf,

                          state->dst_doca_buf,

                          memcpy_task_user_data,

                          &memcpy_task);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Failed to submit dma memcpy task: Failed to allocate task: %s",

                  doca_error_get_descr(status));

         return status;

     }


     /* Submit DMA task */

     task = doca_dma_task_memcpy_as_task(memcpy_task);

     status = doca_task_submit(task);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Failed to submit dma memcpy task: %s", doca_error_get_descr(status));

         return status;

     }


     while (!is_task_done) {

         (void)doca_pe_progress(state->core_objs.pe);

         nanosleep(&ts, &ts);

     }


     /* Get task status */

     status = doca_task_get_status(task);


     /* Free task */

     doca_task_free(task);


     /* Check task status */

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("DMA task event returned unsuccessfully: %s", doca_error_get_descr(status));

         return status;

     }


     DOCA_LOG_INFO("Success, DMA memcpy job done successfully");


     return DOCA_SUCCESS;

 }


 /*

  * Launch a CUDA kernel to read from the GPU destination buffer

  *

  * @gpu_dst_buffer [in]: The GPU destination buffer address

  * @dma_gpu [in]: The GPU DMA object

  * @src_gpu_buf_arr [in]: The GPU buff array src

  * @dst_gpu_buf_arr [in]: The GPU buff array dest

  * @return: DOCA_SUCCESS on success and DOCA_ERROR otherwise

  */

 static doca_error_t launch_cuda_kernel(uintptr_t gpu_dst_buffer,

                        struct doca_gpu_dma *dma_gpu,

                        struct doca_gpu_buf_arr *src_gpu_buf_arr,

                        struct doca_gpu_buf_arr *dst_gpu_buf_arr)

 {

     doca_error_t status;

     cudaStream_t cuda_stream;

     cudaError_t res_rt = cudaSuccess;


     res_rt = cudaStreamCreateWithFlags(&cuda_stream, cudaStreamNonBlocking);

     if (res_rt != cudaSuccess) {

         DOCA_LOG_ERR("Function cudaStreamCreateWithFlags error %d", res_rt);

         return DOCA_ERROR_DRIVER;

     }


     status = gpunetio_dma_memcpy_common_launch_kernel(cuda_stream,

                               gpu_dst_buffer,

                               dma_gpu,

                               src_gpu_buf_arr,

                               dst_gpu_buf_arr);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Function dma_gpu_copy_common_launch_kernel returned %s", doca_error_get_descr(status));

         return status;

     }


     res_rt = cudaDeviceSynchronize();

     if (res_rt != cudaSuccess) {

         DOCA_LOG_ERR("Function cudaDeviceSynchronize error %d", res_rt);

         return DOCA_ERROR_DRIVER;

     }


     return DOCA_SUCCESS;

 }


 /*

  * GPU DMA Memcpy sample

  *

  * @cfg [in]: Sample config parameters

  * @return: DOCA_SUCCESS on success and DOCA_ERROR otherwise

  */

 doca_error_t gpunetio_dma_memcpy(struct gpu_dma_config *cfg)

 {

     doca_error_t status;

     struct gpu_dma_sample_objects state_cpu_gpu = {0};

     struct gpu_dma_sample_objects state_gpu_cpu = {0};


 #if 0

     struct doca_log_backend *stdout_logger = NULL;


     status = doca_log_backend_create_with_file_sdk(stdout, &stdout_logger);

     if (status != DOCA_SUCCESS)

             return status;


     status = doca_log_backend_set_sdk_level(stdout_logger, DOCA_LOG_LEVEL_TRACE);

     if (status != DOCA_SUCCESS)

             return status;


     if (cfg == NULL) {

         DOCA_LOG_ERR("Invalid sample configuration input value");

         return DOCA_ERROR_INVALID_VALUE;

     }

 #endif

     status = init_doca_device(cfg->nic_pcie_addr, &state_cpu_gpu.core_objs.dev);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Function init_doca_device returned %s", doca_error_get_descr(status));

         return status;

     }


     status = doca_gpu_create(cfg->gpu_pcie_addr, &state_cpu_gpu.gpu_dev);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Function doca_gpu_create returned %s", doca_error_get_descr(status));

         goto gpu_dma_cleanup;

     }


     state_cpu_gpu.gpu_datapath = false;

     state_gpu_cpu.core_objs.dev = state_cpu_gpu.core_objs.dev;

     state_gpu_cpu.gpu_datapath = true;

     state_gpu_cpu.gpu_dev = state_cpu_gpu.gpu_dev;


     status = init_sample_mem_objs(&state_cpu_gpu);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Function init_sample_mem_objs returned %s", doca_error_get_descr(status));

         goto gpu_dma_cleanup;

     }


     status = init_sample_mem_objs(&state_gpu_cpu);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Function init_sample_mem_objs returned %s", doca_error_get_descr(status));

         goto gpu_dma_cleanup;

     }


     status = init_dma_ctx(&state_cpu_gpu);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Function init_dma_ctx returned %s", doca_error_get_descr(status));

         goto gpu_dma_cleanup;

     }


     status = init_dma_ctx(&state_gpu_cpu);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Function init_dma_ctx returned %s", doca_error_get_descr(status));

         goto gpu_dma_cleanup;

     }


     status = submit_dma_memcpy_task(&state_cpu_gpu);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Function submit_dma_memcpy_task returned %s", doca_error_get_descr(status));

         goto gpu_dma_cleanup;

     }


     status = doca_dma_get_gpu_handle(state_gpu_cpu.dma, &state_gpu_cpu.dma_gpu);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Function submit_dma_memcpy_task returned %s", doca_error_get_descr(status));

         goto gpu_dma_cleanup;

     }


     status = launch_cuda_kernel((uintptr_t)state_cpu_gpu.dst_buffer,

                     state_gpu_cpu.dma_gpu,

                     state_gpu_cpu.src_doca_gpu_buf_arr,

                     state_gpu_cpu.dst_doca_gpu_buf_arr);

     if (status != DOCA_SUCCESS) {

         DOCA_LOG_ERR("Function launch_cuda_kernel returned %s", doca_error_get_descr(status));

         goto gpu_dma_cleanup;

     }


     while (state_gpu_cpu.dst_buffer[0] == DEFAULT_VALUE)

         ;


     printf("CPU received message from GPU: %s\n", state_gpu_cpu.dst_buffer);


 gpu_dma_cleanup:

     gpu_dma_cleanup(&state_gpu_cpu);

     gpu_dma_cleanup(&state_cpu_gpu);


     return status;

 }

NULL
#define NULL
Definition: __stddef_null.h:26

destroy_core_objects
doca_error_t destroy_core_objects(struct program_core_objects *state)
Definition: common.c:392

create_core_objects
doca_error_t create_core_objects(struct program_core_objects *state, uint32_t max_bufs)
Definition: common.c:302

open_doca_device_with_pci
static doca_error_t open_doca_device_with_pci(const char *pcie_value, struct doca_dev **retval)
Definition: device.c:43

doca_buf.h

doca_buf_inventory.h

doca_log.h

doca_mmap.h

doca_pe.h

stdout_logger
struct doca_log_backend * stdout_logger
Definition: dpa_nvqual_sample.c:42

ddev
static struct doca_dev * ddev
Definition: gpu_packet_processing.c:41

gpunetio_dma_common.h

gpunetio_dma_memcpy_common_launch_kernel
doca_error_t gpunetio_dma_memcpy_common_launch_kernel(cudaStream_t stream, uintptr_t gpu_buffer_addr, struct doca_gpu_dma *dma_gpu, struct doca_gpu_buf_arr *src_gpu_buf_arr, struct doca_gpu_buf_arr *dst_gpu_buf_arr)

DMA_MEMCPY_SIZE
#define DMA_MEMCPY_SIZE
Definition: gpunetio_dma_common.h:43

launch_cuda_kernel
static doca_error_t launch_cuda_kernel(uintptr_t gpu_dst_buffer, struct doca_gpu_dma *dma_gpu, struct doca_gpu_buf_arr *src_gpu_buf_arr, struct doca_gpu_buf_arr *dst_gpu_buf_arr)
Definition: gpunetio_dma_memcpy_sample.c:564

memcpy_task_common_callback
static void memcpy_task_common_callback(struct doca_dma_task_memcpy *dma_task, union doca_data task_user_data, union doca_data ctx_user_data)
Definition: gpunetio_dma_memcpy_sample.c:75

DEFAULT_VALUE
#define DEFAULT_VALUE
Definition: gpunetio_dma_memcpy_sample.c:42

init_doca_device
static doca_error_t init_doca_device(char *nic_pcie_addr, struct doca_dev **ddev)
Definition: gpunetio_dma_memcpy_sample.c:94

DOCA_LOG_REGISTER
DOCA_LOG_REGISTER(GPU_DMA_MEMCPY::SAMPLE)

init_dma_ctx
static doca_error_t init_dma_ctx(struct gpu_dma_sample_objects *state)
Definition: gpunetio_dma_memcpy_sample.c:445

gpu_dma_cleanup
static void gpu_dma_cleanup(struct gpu_dma_sample_objects *state)
Definition: gpunetio_dma_memcpy_sample.c:339

is_task_done
static uint8_t is_task_done
Definition: gpunetio_dma_memcpy_sample.c:45

gpunetio_dma_memcpy
doca_error_t gpunetio_dma_memcpy(struct gpu_dma_config *cfg)
Definition: gpunetio_dma_memcpy_sample.c:604

GPU_PAGE_SIZE
#define GPU_PAGE_SIZE
Definition: gpunetio_dma_memcpy_sample.c:39

NUM_TASKS
#define NUM_TASKS
Definition: gpunetio_dma_memcpy_sample.c:40

NUM_BUFS
#define NUM_BUFS
Definition: gpunetio_dma_memcpy_sample.c:41

submit_dma_memcpy_task
static doca_error_t submit_dma_memcpy_task(struct gpu_dma_sample_objects *state)
Definition: gpunetio_dma_memcpy_sample.c:502

init_sample_mem_objs
static doca_error_t init_sample_mem_objs(struct gpu_dma_sample_objects *state)
Definition: gpunetio_dma_memcpy_sample.c:116

SLEEP_IN_NANOS
#define SLEEP_IN_NANOS
Definition: gpunetio_dma_memcpy_sample.c:38

doca_buf_arr_set_params
DOCA_EXPERIMENTAL doca_error_t doca_buf_arr_set_params(struct doca_buf_arr *buf_arr, struct doca_mmap *mmap, size_t elem_size, uint64_t start_offset)
Sets the buf array params.

doca_buf_arr_set_target_gpu
DOCA_EXPERIMENTAL doca_error_t doca_buf_arr_set_target_gpu(struct doca_buf_arr *buf_arr, struct doca_gpu *gpu_handler)
Configures the buf array to be created on the gpu device.

doca_buf_arr_get_gpu_handle
DOCA_EXPERIMENTAL doca_error_t doca_buf_arr_get_gpu_handle(const struct doca_buf_arr *buf_arr, struct doca_gpu_buf_arr **gpu_buf_arr)
Retrieves the handle in the gpu memory space of a doca_buf_arr.

doca_buf_arr_create
DOCA_EXPERIMENTAL doca_error_t doca_buf_arr_create(size_t num_elem, struct doca_buf_arr **buf_arr)
Allocates a doca_buf_arr.

doca_buf_arr_start
DOCA_EXPERIMENTAL doca_error_t doca_buf_arr_start(struct doca_buf_arr *buf_arr)
This method enables the allocation of doca_bufs.

doca_buf_inventory_buf_get_by_addr
static doca_error_t doca_buf_inventory_buf_get_by_addr(struct doca_buf_inventory *inventory, struct doca_mmap *mmap, void *addr, size_t len, struct doca_buf **buf)
Allocate single element from buffer inventory and point it to the buffer defined by addr & len argume...
Definition: doca_buf_inventory.h:197

doca_buf_inventory_buf_get_by_data
static doca_error_t doca_buf_inventory_buf_get_by_data(struct doca_buf_inventory *inventory, struct doca_mmap *mmap, void *data, size_t data_len, struct doca_buf **buf)
Allocate single element from buffer inventory and point it to the buffer defined by data & data_len a...
Definition: doca_buf_inventory.h:228

doca_buf_dec_refcount
DOCA_STABLE doca_error_t doca_buf_dec_refcount(struct doca_buf *buf, uint16_t *refcount)
Decrease the object reference count by 1, if 0 reached, return the element back to the inventory.

doca_ctx_start
DOCA_STABLE doca_error_t doca_ctx_start(struct doca_ctx *ctx)
Finalizes all configurations, and starts the DOCA CTX.

doca_ctx_set_datapath_on_gpu
DOCA_EXPERIMENTAL doca_error_t doca_ctx_set_datapath_on_gpu(struct doca_ctx *ctx, struct doca_gpu *gpu_dev)
This function binds the DOCA context to a gpu device.

doca_ctx_stop
DOCA_STABLE doca_error_t doca_ctx_stop(struct doca_ctx *ctx)
Stops the context allowing reconfiguration.

doca_dma_get_gpu_handle
DOCA_EXPERIMENTAL doca_error_t doca_dma_get_gpu_handle(struct doca_dma *dma, struct doca_gpu_dma **gpu_dma)
Retrieve the handle in the GPU memory space of a doca_dma.

doca_dma_task_memcpy_as_task
DOCA_STABLE struct doca_task * doca_dma_task_memcpy_as_task(struct doca_dma_task_memcpy *task)
This method converts a memcpy task to doca_task.

doca_dma_task_memcpy_alloc_init
DOCA_STABLE doca_error_t doca_dma_task_memcpy_alloc_init(struct doca_dma *dma, const struct doca_buf *src, struct doca_buf *dst, union doca_data user_data, struct doca_dma_task_memcpy **task)
This method allocates and initializes a DMA memcpy task.

doca_dma_as_ctx
DOCA_STABLE struct doca_ctx * doca_dma_as_ctx(struct doca_dma *dma)

doca_dma_task_memcpy_set_conf
DOCA_STABLE doca_error_t doca_dma_task_memcpy_set_conf(struct doca_dma *dma, doca_dma_task_memcpy_completion_cb_t task_completion_cb, doca_dma_task_memcpy_completion_cb_t task_error_cb, uint32_t num_memcpy_tasks)
This method sets the DMA memcpy tasks configuration.

doca_dma_create
DOCA_STABLE doca_error_t doca_dma_create(struct doca_dev *dev, struct doca_dma **dma)

doca_dma_destroy
DOCA_STABLE doca_error_t doca_dma_destroy(struct doca_dma *dma)

doca_error_t
enum doca_error doca_error_t
DOCA API return codes.

doca_error_get_descr
DOCA_STABLE const char * doca_error_get_descr(doca_error_t error)
Returns the description string of an error code.

DOCA_ERROR_INVALID_VALUE
@ DOCA_ERROR_INVALID_VALUE
Definition: doca_error.h:44

DOCA_SUCCESS
@ DOCA_SUCCESS
Definition: doca_error.h:38

DOCA_ERROR_NO_MEMORY
@ DOCA_ERROR_NO_MEMORY
Definition: doca_error.h:45

DOCA_ERROR_DRIVER
@ DOCA_ERROR_DRIVER
Definition: doca_error.h:59

DOCA_LOG_ERR
#define DOCA_LOG_ERR(format,...)
Generates an ERROR application log message.
Definition: doca_log.h:466

DOCA_LOG_INFO
#define DOCA_LOG_INFO(format,...)
Generates an INFO application log message.
Definition: doca_log.h:486

doca_log_backend_create_with_file_sdk
DOCA_EXPERIMENTAL doca_error_t doca_log_backend_create_with_file_sdk(FILE *fptr, struct doca_log_backend **backend)
Create a logging backend with a FILE* stream for SDK messages.

doca_log_backend_set_sdk_level
DOCA_EXPERIMENTAL doca_error_t doca_log_backend_set_sdk_level(struct doca_log_backend *backend, uint32_t level)
Set the log level limit for SDK logging backends.

DOCA_LOG_LEVEL_TRACE
@ DOCA_LOG_LEVEL_TRACE
Definition: doca_log.h:50

doca_mmap_set_memrange
DOCA_STABLE doca_error_t doca_mmap_set_memrange(struct doca_mmap *mmap, void *addr, size_t len)
Set the memory range of DOCA memory map.

doca_mmap_destroy
DOCA_STABLE doca_error_t doca_mmap_destroy(struct doca_mmap *mmap)
Destroy DOCA Memory Map structure.

doca_mmap_create
DOCA_STABLE doca_error_t doca_mmap_create(struct doca_mmap **mmap)
Allocates zero size memory map object with default/unset attributes.

doca_mmap_start
DOCA_STABLE doca_error_t doca_mmap_start(struct doca_mmap *mmap)
Start DOCA Memory Map.

doca_mmap_add_dev
DOCA_STABLE doca_error_t doca_mmap_add_dev(struct doca_mmap *mmap, struct doca_dev *dev)
Register DOCA memory map on a given device.

doca_task_get_status
DOCA_STABLE doca_error_t doca_task_get_status(const struct doca_task *task)
Get task status.

doca_pe_connect_ctx
DOCA_STABLE doca_error_t doca_pe_connect_ctx(struct doca_pe *pe, struct doca_ctx *ctx)
This method connects a context to a progress engine.

doca_task_submit
DOCA_STABLE doca_error_t doca_task_submit(struct doca_task *task)
Submit a task to a progress engine.

doca_pe_progress
DOCA_STABLE uint8_t doca_pe_progress(struct doca_pe *pe)
Run the progress engine.

doca_task_free
DOCA_STABLE void doca_task_free(struct doca_task *task)
Free a task back to where it was allocated from.

DOCA_GPU_MEM_TYPE_GPU_CPU
@ DOCA_GPU_MEM_TYPE_GPU_CPU
Definition: doca_types.h:133

DOCA_GPU_MEM_TYPE_GPU
@ DOCA_GPU_MEM_TYPE_GPU
Definition: doca_types.h:131

cfg
const struct ip_frag_config * cfg
Definition: ip_frag_dp.c:0

stdbool.h

uintptr_t
__UINTPTR_TYPE__ uintptr_t
Definition: stdint.h:298

gpu_dma_config
Definition: gpunetio_dma_common.h:46

gpu_dma_sample_objects
Definition: gpunetio_dma_memcpy_sample.c:52

gpu_dma_sample_objects::gpu_dev
struct doca_gpu * gpu_dev
Definition: gpunetio_dma_memcpy_sample.c:56

gpu_dma_sample_objects::src_doca_gpu_buf_arr
struct doca_gpu_buf_arr * src_doca_gpu_buf_arr
Definition: gpunetio_dma_memcpy_sample.c:61

gpu_dma_sample_objects::dst_doca_gpu_buf_arr
struct doca_gpu_buf_arr * dst_doca_gpu_buf_arr
Definition: gpunetio_dma_memcpy_sample.c:62

gpu_dma_sample_objects::dma_gpu
struct doca_gpu_dma * dma_gpu
Definition: gpunetio_dma_memcpy_sample.c:55

gpu_dma_sample_objects::dst_doca_buf
struct doca_buf * dst_doca_buf
Definition: gpunetio_dma_memcpy_sample.c:58

gpu_dma_sample_objects::src_doca_buf_arr
struct doca_buf_arr * src_doca_buf_arr
Definition: gpunetio_dma_memcpy_sample.c:59

gpu_dma_sample_objects::core_objs
struct program_core_objects core_objs
Definition: gpunetio_dma_memcpy_sample.c:53

gpu_dma_sample_objects::dst_doca_buf_arr
struct doca_buf_arr * dst_doca_buf_arr
Definition: gpunetio_dma_memcpy_sample.c:60

gpu_dma_sample_objects::src_buffer
char * src_buffer
Definition: gpunetio_dma_memcpy_sample.c:63

gpu_dma_sample_objects::gpu_datapath
bool gpu_datapath
Definition: gpunetio_dma_memcpy_sample.c:65

gpu_dma_sample_objects::src_doca_buf
struct doca_buf * src_doca_buf
Definition: gpunetio_dma_memcpy_sample.c:57

gpu_dma_sample_objects::dma
struct doca_dma * dma
Definition: gpunetio_dma_memcpy_sample.c:54

gpu_dma_sample_objects::dst_buffer
char * dst_buffer
Definition: gpunetio_dma_memcpy_sample.c:64

program_core_objects
Definition: common.h:45

program_core_objects::pe
struct doca_pe * pe
Definition: common.h:51

program_core_objects::src_mmap
struct doca_mmap * src_mmap
Definition: common.h:47

program_core_objects::buf_inv
struct doca_buf_inventory * buf_inv
Definition: common.h:49

program_core_objects::dev
struct doca_dev * dev
Definition: common.h:46

program_core_objects::dst_mmap
struct doca_mmap * dst_mmap
Definition: common.h:48

program_core_objects::ctx
struct doca_ctx * ctx
Definition: common.h:50

doca_data
Convenience type for representing opaque data.
Definition: doca_types.h:56