[PATCH libdrm 4/9] amdgpu: Add struct amdgpu_core_device and amdgpu_core_bo

Michel Dänzer Mon, 24 Jun 2019 09:55:14 -0700

From: Michel Dänzer <michel.daen...@amd.com>

The new core structs can each be referenced by any number of struct
amdgpu_device / struct amdgpu_bo instances, which are what
amdgpu_device_handle / amdgpu_bo_handle refer to in the public API.


This allows keeping track of the DRM file descriptor passed to
amdgpu_device_initialize and the one used for CS submission etc.
separately. The core structs hold the information relevant for the
latter.

Because we now always keep a duplicate of the file descriptor passed to
amdgpu_device_initialize, we can use that for flink, and we no longer
need to check its authentication status (flink could never be expected
to work after passing an unauthenticated file descriptor to
amdgpu_device_initialize).

Signed-off-by: Michel Dänzer <michel.daen...@amd.com>
---
 amdgpu/amdgpu_asic_id.c       |   4 +-
 amdgpu/amdgpu_bo.c            | 251 ++++++++++++++++++++++------------
 amdgpu/amdgpu_cs.c            |  64 +++++----
 amdgpu/amdgpu_device.c        | 219 ++++++++++++-----------------
 amdgpu/amdgpu_gpu_info.c      |  35 ++---
 amdgpu/amdgpu_internal.h      |  27 ++--
 amdgpu/amdgpu_vamgr.c         |   9 +-
 amdgpu/amdgpu_vm.c            |   4 +-
 tests/amdgpu/amdgpu_test.c    |   2 +-
 tests/amdgpu/bo_tests.c       |   2 +-
 tests/amdgpu/cs_tests.c       |   8 +-
 tests/amdgpu/deadlock_tests.c |   8 +-
 tests/amdgpu/uvd_enc_tests.c  |   2 +-
 tests/amdgpu/vce_tests.c      |  12 +-
 tests/amdgpu/vcn_tests.c      |   4 +-
 tests/amdgpu/vm_tests.c       |   2 +-
 16 files changed, 360 insertions(+), 293 deletions(-)

diff --git a/amdgpu/amdgpu_asic_id.c b/amdgpu/amdgpu_asic_id.c
index a5007ffc..356c8a59 100644
--- a/amdgpu/amdgpu_asic_id.c
+++ b/amdgpu/amdgpu_asic_id.c
@@ -34,7 +34,7 @@
 #include "amdgpu_drm.h"
 #include "amdgpu_internal.h"
 
-static int parse_one_line(struct amdgpu_device *dev, const char *line)
+static int parse_one_line(struct amdgpu_core_device *dev, const char *line)
 {
        char *buf, *saveptr;
        char *s_did;
@@ -104,7 +104,7 @@ out:
        return r;
 }
 
-void amdgpu_parse_asic_ids(struct amdgpu_device *dev)
+void amdgpu_parse_asic_ids(struct amdgpu_core_device *dev)
 {
        FILE *fp;
        char *line = NULL;
diff --git a/amdgpu/amdgpu_bo.c b/amdgpu/amdgpu_bo.c
index 5bdb8fe8..7fec1f15 100644
--- a/amdgpu/amdgpu_bo.c
+++ b/amdgpu/amdgpu_bo.c
@@ -47,15 +47,15 @@ static int amdgpu_close_kms_handle(int fd, uint32_t handle)
        return drmIoctl(fd, DRM_IOCTL_GEM_CLOSE, &args);
 }
 
-static int amdgpu_bo_create(amdgpu_device_handle dev,
-                           uint64_t size,
-                           uint32_t handle,
-                           amdgpu_bo_handle *buf_handle)
+static int amdgpu_core_bo_create(struct amdgpu_core_device *dev,
+                                uint64_t size,
+                                uint32_t handle,
+                                struct amdgpu_core_bo **out_bo)
 {
-       struct amdgpu_bo *bo;
+       struct amdgpu_core_bo *bo;
        int r;
 
-       bo = calloc(1, sizeof(struct amdgpu_bo));
+       bo = calloc(1, sizeof(struct amdgpu_core_bo));
        if (!bo)
                return -ENOMEM;
 
@@ -66,19 +66,64 @@ static int amdgpu_bo_create(amdgpu_device_handle dev,
        }
 
        atomic_set(&bo->refcount, 1);
-       bo->dev = dev;
        bo->alloc_size = size;
        bo->handle = handle;
        pthread_mutex_init(&bo->cpu_access_mutex, NULL);
 
-       *buf_handle = bo;
+       *out_bo = bo;
        return 0;
 }
 
-drm_public int amdgpu_bo_alloc(amdgpu_device_handle dev,
+static int amdgpu_bo_create(amdgpu_device_handle user_dev,
+                           uint64_t size,
+                           uint32_t handle,
+                           amdgpu_bo_handle *buf_handle)
+{
+       struct amdgpu_core_device *dev = user_dev->core;
+       struct amdgpu_bo *user_bo = NULL;
+       struct amdgpu_core_bo *bo;
+       int r;
+
+       bo = handle_table_lookup(&dev->bo_handles, handle);
+
+       if (bo) {
+               for (user_bo = bo->user_bos; user_bo; user_bo = user_bo->next) {
+                       if (user_bo->dev == user_dev) {
+                               /* Re-use existing buffer */
+                               atomic_inc(&user_bo->refcount);
+                               r = 0;
+                               goto out;
+                       }
+               }
+               atomic_inc(&bo->refcount);
+       } else {
+               r = amdgpu_core_bo_create(dev, size, handle, &bo);
+               if (r)
+                       goto out;
+       }
+
+       user_bo = calloc(1, sizeof(struct amdgpu_bo));
+       if (!user_bo) {
+               r = -ENOMEM;
+               goto out;
+       }
+
+       atomic_set(&user_bo->refcount, 1);
+       user_bo->next = bo->user_bos;
+       bo->user_bos = user_bo;
+       user_bo->core = bo;
+       user_bo->dev = user_dev;
+
+out:
+       *buf_handle = user_bo;
+       return r;
+}
+
+drm_public int amdgpu_bo_alloc(amdgpu_device_handle user_dev,
                               struct amdgpu_bo_alloc_request *alloc_buffer,
                               amdgpu_bo_handle *buf_handle)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
        union drm_amdgpu_gem_create args;
        int r;
 
@@ -97,8 +142,8 @@ drm_public int amdgpu_bo_alloc(amdgpu_device_handle dev,
                goto out;
 
        pthread_mutex_lock(&dev->bo_table_mutex);
-       r = amdgpu_bo_create(dev, alloc_buffer->alloc_size, args.out.handle,
-                            buf_handle);
+       r = amdgpu_bo_create(user_dev, alloc_buffer->alloc_size,
+                            args.out.handle, buf_handle);
        pthread_mutex_unlock(&dev->bo_table_mutex);
        if (r) {
                amdgpu_close_kms_handle(dev->fd, args.out.handle);
@@ -108,9 +153,10 @@ out:
        return r;
 }
 
-drm_public int amdgpu_bo_set_metadata(amdgpu_bo_handle bo,
+drm_public int amdgpu_bo_set_metadata(amdgpu_bo_handle user_bo,
                                      struct amdgpu_bo_metadata *info)
 {
+       struct amdgpu_core_bo *bo = user_bo->core;
        struct drm_amdgpu_gem_metadata args = {};
 
        args.handle = bo->handle;
@@ -126,17 +172,19 @@ drm_public int amdgpu_bo_set_metadata(amdgpu_bo_handle bo,
                memcpy(args.data.data, info->umd_metadata, info->size_metadata);
        }
 
-       return drmCommandWriteRead(bo->dev->fd,
+       return drmCommandWriteRead(user_bo->dev->core->fd,
                                   DRM_AMDGPU_GEM_METADATA,
                                   &args, sizeof(args));
 }
 
-drm_public int amdgpu_bo_query_info(amdgpu_bo_handle bo,
+drm_public int amdgpu_bo_query_info(amdgpu_bo_handle user_bo,
                                    struct amdgpu_bo_info *info)
 {
+       struct amdgpu_core_bo *bo = user_bo->core;
        struct drm_amdgpu_gem_metadata metadata = {};
        struct drm_amdgpu_gem_create_in bo_info = {};
        struct drm_amdgpu_gem_op gem_op = {};
+       int fd = user_bo->dev->core->fd;
        int r;
 
        /* Validate the BO passed in */
@@ -147,8 +195,8 @@ drm_public int amdgpu_bo_query_info(amdgpu_bo_handle bo,
        metadata.handle = bo->handle;
        metadata.op = AMDGPU_GEM_METADATA_OP_GET_METADATA;
 
-       r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_METADATA,
-                               &metadata, sizeof(metadata));
+       r = drmCommandWriteRead(fd, DRM_AMDGPU_GEM_METADATA, &metadata,
+                               sizeof(metadata));
        if (r)
                return r;
 
@@ -161,8 +209,7 @@ drm_public int amdgpu_bo_query_info(amdgpu_bo_handle bo,
        gem_op.op = AMDGPU_GEM_OP_GET_GEM_CREATE_INFO;
        gem_op.value = (uintptr_t)&bo_info;
 
-       r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_OP,
-                               &gem_op, sizeof(gem_op));
+       r = drmCommandWriteRead(fd, DRM_AMDGPU_GEM_OP, &gem_op, sizeof(gem_op));
        if (r)
                return r;
 
@@ -182,29 +229,30 @@ drm_public int amdgpu_bo_query_info(amdgpu_bo_handle bo,
        return 0;
 }
 
-static int amdgpu_bo_export_flink(amdgpu_bo_handle bo)
+static int amdgpu_bo_export_flink(amdgpu_bo_handle user_bo)
 {
+       struct amdgpu_core_device *dev = user_bo->dev->core;
+       struct amdgpu_core_bo *bo = user_bo->core;
+       int user_fd = user_bo->dev->user_fd;
        struct drm_gem_flink flink;
        int fd, dma_fd;
        uint32_t handle;
        int r;
 
-       fd = bo->dev->fd;
+       fd = dev->fd;
        handle = bo->handle;
        if (bo->flink_name)
                return 0;
 
-
-       if (bo->dev->flink_fd != bo->dev->fd) {
-               r = drmPrimeHandleToFD(bo->dev->fd, bo->handle, DRM_CLOEXEC,
-                                      &dma_fd);
+       if (user_fd != fd) {
+               r = drmPrimeHandleToFD(fd, bo->handle, DRM_CLOEXEC, &dma_fd);
                if (!r) {
-                       r = drmPrimeFDToHandle(bo->dev->flink_fd, dma_fd, &handle);
+                       r = drmPrimeFDToHandle(user_fd, dma_fd, &handle);
                        close(dma_fd);
                }
                if (r)
                        return r;
-               fd = bo->dev->flink_fd;
+               fd = user_fd;
        }
        memset(&flink, 0, sizeof(flink));
        flink.handle = handle;
@@ -215,25 +263,26 @@ static int amdgpu_bo_export_flink(amdgpu_bo_handle bo)
 
        bo->flink_name = flink.name;
 
-       if (bo->dev->flink_fd != bo->dev->fd)
-               amdgpu_close_kms_handle(bo->dev->flink_fd, handle);
+       if (user_fd != dev->fd)
+               amdgpu_close_kms_handle(user_fd, handle);
 
-       pthread_mutex_lock(&bo->dev->bo_table_mutex);
-       r = handle_table_insert(&bo->dev->bo_flink_names, bo->flink_name, bo);
-       pthread_mutex_unlock(&bo->dev->bo_table_mutex);
+       pthread_mutex_lock(&dev->bo_table_mutex);
+       r = handle_table_insert(&dev->bo_flink_names, bo->flink_name, bo);
+       pthread_mutex_unlock(&dev->bo_table_mutex);
 
        return r;
 }
 
-drm_public int amdgpu_bo_export(amdgpu_bo_handle bo,
+drm_public int amdgpu_bo_export(amdgpu_bo_handle user_bo,
                                enum amdgpu_bo_handle_type type,
                                uint32_t *shared_handle)
 {
+       struct amdgpu_core_bo *bo = user_bo->core;
        int r;
 
        switch (type) {
        case amdgpu_bo_handle_type_gem_flink_name:
-               r = amdgpu_bo_export_flink(bo);
+               r = amdgpu_bo_export_flink(user_bo);
                if (r)
                        return r;
 
@@ -246,21 +295,24 @@ drm_public int amdgpu_bo_export(amdgpu_bo_handle bo,
                return 0;
 
        case amdgpu_bo_handle_type_dma_buf_fd:
-               return drmPrimeHandleToFD(bo->dev->fd, bo->handle,
+               return drmPrimeHandleToFD(user_bo->dev->core->fd, bo->handle,
                                          DRM_CLOEXEC | DRM_RDWR,
                                          (int*)shared_handle);
        }
        return -EINVAL;
 }
 
-drm_public int amdgpu_bo_import(amdgpu_device_handle dev,
+drm_public int amdgpu_bo_import(amdgpu_device_handle user_dev,
                                enum amdgpu_bo_handle_type type,
                                uint32_t shared_handle,
-                    struct amdgpu_bo_import_result *output)
+                               struct amdgpu_bo_import_result *output)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
        struct drm_gem_open open_arg = {};
-       struct amdgpu_bo *bo = NULL;
+       struct amdgpu_bo *user_bo = NULL;
        uint32_t handle = 0, flink_name = 0;
+       int user_fd = user_dev->user_fd;
+       struct amdgpu_core_bo *bo;
        uint64_t alloc_size = 0;
        int r = 0;
        int dma_fd;
@@ -313,37 +365,32 @@ drm_public int amdgpu_bo_import(amdgpu_device_handle dev,
        }
 
        if (bo) {
-               /* The buffer already exists, just bump the refcount. */
-               atomic_inc(&bo->refcount);
-               pthread_mutex_unlock(&dev->bo_table_mutex);
-
-               output->buf_handle = bo;
-               output->alloc_size = bo->alloc_size;
-               return 0;
+               handle = bo->handle;
+               alloc_size = bo->alloc_size;
+               goto bo_create;
        }
 
        /* Open the handle. */
        switch (type) {
        case amdgpu_bo_handle_type_gem_flink_name:
                open_arg.name = shared_handle;
-               r = drmIoctl(dev->flink_fd, DRM_IOCTL_GEM_OPEN, &open_arg);
+               r = drmIoctl(user_fd, DRM_IOCTL_GEM_OPEN, &open_arg);
                if (r)
                        goto unlock;
 
                flink_name = shared_handle;
                handle = open_arg.handle;
                alloc_size = open_arg.size;
-               if (dev->flink_fd != dev->fd) {
-                       r = drmPrimeHandleToFD(dev->flink_fd, handle,
-                                              DRM_CLOEXEC, &dma_fd);
+               if (user_fd != dev->fd) {
+                       r = drmPrimeHandleToFD(user_fd, handle, DRM_CLOEXEC,
+                                              &dma_fd);
                        if (r)
                                goto free_bo_handle;
                        r = drmPrimeFDToHandle(dev->fd, dma_fd, &handle);
                        close(dma_fd);
                        if (r)
                                goto free_bo_handle;
-                       r = amdgpu_close_kms_handle(dev->flink_fd,
-                                                   open_arg.handle);
+                       r = amdgpu_close_kms_handle(user_fd, open_arg.handle);
                        if (r)
                                goto free_bo_handle;
                }
@@ -360,11 +407,13 @@ drm_public int amdgpu_bo_import(amdgpu_device_handle dev,
                assert(0); /* unreachable */
        }
 
+bo_create:
        /* Initialize it. */
-       r = amdgpu_bo_create(dev, alloc_size, handle, &bo);
+       r = amdgpu_bo_create(user_dev, alloc_size, handle, &user_bo);
        if (r)
                goto free_bo_handle;
 
+       bo = user_bo->core;
        if (flink_name) {
                bo->flink_name = flink_name;
                r = handle_table_insert(&dev->bo_flink_names, flink_name,
@@ -374,17 +423,17 @@ drm_public int amdgpu_bo_import(amdgpu_device_handle dev,
 
        }
 
-       output->buf_handle = bo;
+       output->buf_handle = user_bo;
        output->alloc_size = bo->alloc_size;
        pthread_mutex_unlock(&dev->bo_table_mutex);
        return 0;
 
 free_bo_handle:
        if (flink_name && open_arg.handle)
-               amdgpu_close_kms_handle(dev->flink_fd, open_arg.handle);
+               amdgpu_close_kms_handle(user_fd, open_arg.handle);
 
-       if (bo)
-               amdgpu_bo_free(bo);
+       if (user_bo)
+               amdgpu_bo_free(user_bo);
        else
                amdgpu_close_kms_handle(dev->fd, handle);
 unlock:
@@ -392,14 +441,10 @@ unlock:
        return r;
 }
 
-drm_public int amdgpu_bo_free(amdgpu_bo_handle buf_handle)
+static void amdgpu_core_bo_free(struct amdgpu_bo *user_bo)
 {
-       struct amdgpu_device *dev;
-       struct amdgpu_bo *bo = buf_handle;
-
-       assert(bo != NULL);
-       dev = bo->dev;
-       pthread_mutex_lock(&dev->bo_table_mutex);
+       struct amdgpu_core_device *dev = user_bo->dev->core;
+       struct amdgpu_core_bo *bo = user_bo->core;
 
        if (update_references(&bo->refcount, NULL)) {
                /* Remove the buffer from the hash tables. */
@@ -412,12 +457,39 @@ drm_public int amdgpu_bo_free(amdgpu_bo_handle buf_handle)
                /* Release CPU access. */
                if (bo->cpu_map_count > 0) {
                        bo->cpu_map_count = 1;
-                       amdgpu_bo_cpu_unmap(bo);
+                       amdgpu_bo_cpu_unmap(user_bo);
                }
 
                amdgpu_close_kms_handle(dev->fd, bo->handle);
                pthread_mutex_destroy(&bo->cpu_access_mutex);
                free(bo);
+       } else if (bo->user_bos == user_bo) {
+               bo->user_bos = user_bo->next;
+       } else {
+               struct amdgpu_bo *iter;
+
+               for (iter = bo->user_bos; iter->next; iter = iter->next) {
+                       if (iter->next == user_bo) {
+                               iter->next = user_bo->next;
+                               break;
+                       }
+               }
+       }
+}
+
+drm_public int amdgpu_bo_free(amdgpu_bo_handle buf_handle)
+{
+       struct amdgpu_bo *user_bo = buf_handle;
+       struct amdgpu_core_device *dev;
+
+       assert(user_bo != NULL);
+       dev = user_bo->dev->core;
+
+       pthread_mutex_lock(&dev->bo_table_mutex);
+
+       if (update_references(&user_bo->refcount, NULL)) {
+               amdgpu_core_bo_free(user_bo);
+               free(user_bo);
        }
 
        pthread_mutex_unlock(&dev->bo_table_mutex);
@@ -430,8 +502,10 @@ drm_public void amdgpu_bo_inc_ref(amdgpu_bo_handle bo)
        atomic_inc(&bo->refcount);
 }
 
-drm_public int amdgpu_bo_cpu_map(amdgpu_bo_handle bo, void **cpu)
+drm_public int amdgpu_bo_cpu_map(amdgpu_bo_handle user_bo, void **cpu)
 {
+       struct amdgpu_core_bo *bo = user_bo->core;
+       int fd = user_bo->dev->core->fd;
        union drm_amdgpu_gem_mmap args;
        void *ptr;
        int r;
@@ -455,8 +529,7 @@ drm_public int amdgpu_bo_cpu_map(amdgpu_bo_handle bo, void **cpu)
         * The kernel driver ignores the offset and size parameters. */
        args.in.handle = bo->handle;
 
-       r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_MMAP, &args,
-                               sizeof(args));
+       r = drmCommandWriteRead(fd, DRM_AMDGPU_GEM_MMAP, &args, sizeof(args));
        if (r) {
                pthread_mutex_unlock(&bo->cpu_access_mutex);
                return r;
@@ -464,7 +537,7 @@ drm_public int amdgpu_bo_cpu_map(amdgpu_bo_handle bo, void **cpu)
 
        /* Map the buffer. */
        ptr = drm_mmap(NULL, bo->alloc_size, PROT_READ | PROT_WRITE, MAP_SHARED,
-                      bo->dev->fd, args.out.addr_ptr);
+                      fd, args.out.addr_ptr);
        if (ptr == MAP_FAILED) {
                pthread_mutex_unlock(&bo->cpu_access_mutex);
                return -errno;
@@ -478,8 +551,9 @@ drm_public int amdgpu_bo_cpu_map(amdgpu_bo_handle bo, void **cpu)
        return 0;
 }
 
-drm_public int amdgpu_bo_cpu_unmap(amdgpu_bo_handle bo)
+drm_public int amdgpu_bo_cpu_unmap(amdgpu_bo_handle user_bo)
 {
+       struct amdgpu_core_bo *bo = user_bo->core;
        int r;
 
        pthread_mutex_lock(&bo->cpu_access_mutex);
@@ -504,18 +578,21 @@ drm_public int amdgpu_bo_cpu_unmap(amdgpu_bo_handle bo)
        return r;
 }
 
-drm_public int amdgpu_query_buffer_size_alignment(amdgpu_device_handle dev,
+drm_public int amdgpu_query_buffer_size_alignment(amdgpu_device_handle user_dev,
                                struct amdgpu_buffer_size_alignments *info)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
+
        info->size_local = dev->dev_info.pte_fragment_size;
        info->size_remote = dev->dev_info.gart_page_size;
        return 0;
 }
 
-drm_public int amdgpu_bo_wait_for_idle(amdgpu_bo_handle bo,
+drm_public int amdgpu_bo_wait_for_idle(amdgpu_bo_handle user_bo,
                                       uint64_t timeout_ns,
                            bool *busy)
 {
+       struct amdgpu_core_bo *bo = user_bo->core;
        union drm_amdgpu_gem_wait_idle args;
        int r;
 
@@ -523,7 +600,7 @@ drm_public int amdgpu_bo_wait_for_idle(amdgpu_bo_handle bo,
        args.in.handle = bo->handle;
        args.in.timeout = amdgpu_cs_calculate_timeout(timeout_ns);
 
-       r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_WAIT_IDLE,
+       r = drmCommandWriteRead(user_bo->dev->core->fd, DRM_AMDGPU_GEM_WAIT_IDLE,
                                &args, sizeof(args));
 
        if (r == 0) {
@@ -535,13 +612,14 @@ drm_public int amdgpu_bo_wait_for_idle(amdgpu_bo_handle bo,
        }
 }
 
-drm_public int amdgpu_find_bo_by_cpu_mapping(amdgpu_device_handle dev,
+drm_public int amdgpu_find_bo_by_cpu_mapping(amdgpu_device_handle user_dev,
                                             void *cpu,
                                             uint64_t size,
                                             amdgpu_bo_handle *buf_handle,
                                             uint64_t *offset_in_bo)
 {
-       struct amdgpu_bo *bo;
+       struct amdgpu_core_device *dev = user_dev->core;
+       struct amdgpu_core_bo *bo;
        uint32_t i;
        int r = 0;
 
@@ -564,8 +642,8 @@ drm_public int amdgpu_find_bo_by_cpu_mapping(amdgpu_device_handle dev,
        }
 
        if (i < dev->bo_handles.max_key) {
-               atomic_inc(&bo->refcount);
-               *buf_handle = bo;
+               r = amdgpu_bo_create(user_dev, bo->alloc_size, bo->handle,
+                                    buf_handle);
                *offset_in_bo = (uintptr_t)cpu - (uintptr_t)bo->cpu_ptr;
        } else {
                *buf_handle = NULL;
@@ -577,11 +655,12 @@ drm_public int amdgpu_find_bo_by_cpu_mapping(amdgpu_device_handle dev,
        return r;
 }
 
-drm_public int amdgpu_create_bo_from_user_mem(amdgpu_device_handle dev,
+drm_public int amdgpu_create_bo_from_user_mem(amdgpu_device_handle user_dev,
                                              void *cpu,
                                              uint64_t size,
                                              amdgpu_bo_handle *buf_handle)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
        int r;
        struct drm_amdgpu_gem_userptr args;
 
@@ -595,7 +674,7 @@ drm_public int amdgpu_create_bo_from_user_mem(amdgpu_device_handle dev,
                goto out;
 
        pthread_mutex_lock(&dev->bo_table_mutex);
-       r = amdgpu_bo_create(dev, size, args.handle, buf_handle);
+       r = amdgpu_bo_create(user_dev, size, args.handle, buf_handle);
        pthread_mutex_unlock(&dev->bo_table_mutex);
        if (r) {
                amdgpu_close_kms_handle(dev->fd, args.handle);
@@ -605,11 +684,12 @@ out:
        return r;
 }
 
-drm_public int amdgpu_bo_list_create_raw(amdgpu_device_handle dev,
+drm_public int amdgpu_bo_list_create_raw(amdgpu_device_handle user_dev,
                                         uint32_t number_of_buffers,
                                         struct drm_amdgpu_bo_list_entry *buffers,
                                         uint32_t *result)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
        union drm_amdgpu_bo_list args;
        int r;
 
@@ -626,9 +706,10 @@ drm_public int amdgpu_bo_list_create_raw(amdgpu_device_handle dev,
        return r;
 }
 
-drm_public int amdgpu_bo_list_destroy_raw(amdgpu_device_handle dev,
+drm_public int amdgpu_bo_list_destroy_raw(amdgpu_device_handle user_dev,
                                          uint32_t bo_list)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
        union drm_amdgpu_bo_list args;
 
        memset(&args, 0, sizeof(args));
@@ -639,12 +720,13 @@ drm_public int amdgpu_bo_list_destroy_raw(amdgpu_device_handle dev,
                                   &args, sizeof(args));
 }
 
-drm_public int amdgpu_bo_list_create(amdgpu_device_handle dev,
+drm_public int amdgpu_bo_list_create(amdgpu_device_handle user_dev,
                                     uint32_t number_of_resources,
                                     amdgpu_bo_handle *resources,
                                     uint8_t *resource_prios,
                                     amdgpu_bo_list_handle *result)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
        struct drm_amdgpu_bo_list_entry *list;
        union drm_amdgpu_bo_list args;
        unsigned i;
@@ -674,7 +756,7 @@ drm_public int amdgpu_bo_list_create(amdgpu_device_handle dev,
        args.in.bo_info_ptr = (uint64_t)(uintptr_t)list;
 
        for (i = 0; i < number_of_resources; i++) {
-               list[i].bo_handle = resources[i]->handle;
+               list[i].bo_handle = resources[i]->core->handle;
                if (resource_prios)
                        list[i].bo_priority = resource_prios[i];
                else
@@ -740,7 +822,7 @@ drm_public int amdgpu_bo_list_update(amdgpu_bo_list_handle handle,
        args.in.bo_info_ptr = (uintptr_t)list;
 
        for (i = 0; i < number_of_resources; i++) {
-               list[i].bo_handle = resources[i]->handle;
+               list[i].bo_handle = resources[i]->core->handle;
                if (resource_prios)
                        list[i].bo_priority = resource_prios[i];
                else
@@ -770,7 +852,7 @@ drm_public int amdgpu_bo_va_op(amdgpu_bo_handle bo,
                                   AMDGPU_VM_PAGE_EXECUTABLE, ops);
 }
 
-drm_public int amdgpu_bo_va_op_raw(amdgpu_device_handle dev,
+drm_public int amdgpu_bo_va_op_raw(amdgpu_device_handle user_dev,
                                   amdgpu_bo_handle bo,
                                   uint64_t offset,
                                   uint64_t size,
@@ -778,6 +860,7 @@ drm_public int amdgpu_bo_va_op_raw(amdgpu_device_handle dev,
                                   uint64_t flags,
                                   uint32_t ops)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
        struct drm_amdgpu_gem_va va;
        int r;
 
@@ -786,7 +869,7 @@ drm_public int amdgpu_bo_va_op_raw(amdgpu_device_handle dev,
                return -EINVAL;
 
        memset(&va, 0, sizeof(va));
-       va.handle = bo ? bo->handle : 0;
+       va.handle = bo ? bo->core->handle : 0;
        va.operation = ops;
        va.flags = flags;
        va.va_address = addr;
diff --git a/amdgpu/amdgpu_cs.c b/amdgpu/amdgpu_cs.c
index 20d5aef2..98130105 100644
--- a/amdgpu/amdgpu_cs.c
+++ b/amdgpu/amdgpu_cs.c
@@ -48,22 +48,24 @@ static int amdgpu_cs_reset_sem(amdgpu_semaphore_handle sem);
  *
  * \return  0 on success otherwise POSIX Error code
 */
-drm_public int amdgpu_cs_ctx_create2(amdgpu_device_handle dev,
+drm_public int amdgpu_cs_ctx_create2(amdgpu_device_handle user_dev,
                                     uint32_t priority,
                                     amdgpu_context_handle *context)
 {
        struct amdgpu_context *gpu_context;
+       struct amdgpu_core_device *dev;
        union drm_amdgpu_ctx args;
        int i, j, k;
        int r;
 
-       if (!dev || !context)
+       if (!user_dev || !context)
                return -EINVAL;
 
        gpu_context = calloc(1, sizeof(struct amdgpu_context));
        if (!gpu_context)
                return -ENOMEM;
 
+       dev = user_dev->core;
        gpu_context->dev = dev;
 
        r = pthread_mutex_init(&gpu_context->sequence_mutex, NULL);
@@ -156,7 +158,7 @@ drm_public int amdgpu_cs_ctx_override_priority(amdgpu_device_handle dev,
        memset(&args, 0, sizeof(args));
 
        args.in.op = AMDGPU_SCHED_OP_CONTEXT_PRIORITY_OVERRIDE;
-       args.in.fd = dev->fd;
+       args.in.fd = dev->core->fd;
        args.in.priority = priority;
        args.in.ctx_id = context->id;
 
@@ -269,7 +271,7 @@ static int amdgpu_cs_submit_one(amdgpu_context_handle context,
                chunks[i].chunk_data = (uint64_t)(uintptr_t)&chunk_data[i];
 
                /* fence bo handle */
-               chunk_data[i].fence_data.handle = ibs_request->fence_info.handle->handle;
+               chunk_data[i].fence_data.handle = ibs_request->fence_info.handle->core->handle;
                /* offset */
                chunk_data[i].fence_data.offset = 
                        ibs_request->fence_info.offset * sizeof(uint64_t);
@@ -409,7 +411,7 @@ static int amdgpu_ioctl_wait_cs(amdgpu_context_handle context,
                                uint64_t flags,
                                bool *busy)
 {
-       amdgpu_device_handle dev = context->dev;
+       struct amdgpu_core_device *dev = context->dev;
        union drm_amdgpu_wait_cs args;
        int r;
 
@@ -471,8 +473,8 @@ static int amdgpu_ioctl_wait_fences(struct amdgpu_cs_fence *fences,
                                    uint32_t *status,
                                    uint32_t *first)
 {
+       struct amdgpu_core_device *dev = fences[0].context->dev;
        struct drm_amdgpu_fence *drm_fences;
-       amdgpu_device_handle dev = fences[0].context->dev;
        union drm_amdgpu_wait_fences args;
        int r;
        uint32_t i;
@@ -633,7 +635,7 @@ drm_public int amdgpu_cs_create_syncobj2(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjCreate(dev->fd, flags, handle);
+       return drmSyncobjCreate(dev->core->fd, flags, handle);
 }
 
 drm_public int amdgpu_cs_create_syncobj(amdgpu_device_handle dev,
@@ -642,7 +644,7 @@ drm_public int amdgpu_cs_create_syncobj(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjCreate(dev->fd, 0, handle);
+       return drmSyncobjCreate(dev->core->fd, 0, handle);
 }
 
 drm_public int amdgpu_cs_destroy_syncobj(amdgpu_device_handle dev,
@@ -651,7 +653,7 @@ drm_public int amdgpu_cs_destroy_syncobj(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjDestroy(dev->fd, handle);
+       return drmSyncobjDestroy(dev->core->fd, handle);
 }
 
 drm_public int amdgpu_cs_syncobj_reset(amdgpu_device_handle dev,
@@ -661,7 +663,7 @@ drm_public int amdgpu_cs_syncobj_reset(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjReset(dev->fd, syncobjs, syncobj_count);
+       return drmSyncobjReset(dev->core->fd, syncobjs, syncobj_count);
 }
 
 drm_public int amdgpu_cs_syncobj_signal(amdgpu_device_handle dev,
@@ -671,7 +673,7 @@ drm_public int amdgpu_cs_syncobj_signal(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjSignal(dev->fd, syncobjs, syncobj_count);
+       return drmSyncobjSignal(dev->core->fd, syncobjs, syncobj_count);
 }
 
 drm_public int amdgpu_cs_syncobj_timeline_signal(amdgpu_device_handle dev,
@@ -682,7 +684,7 @@ drm_public int amdgpu_cs_syncobj_timeline_signal(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjTimelineSignal(dev->fd, syncobjs,
+       return drmSyncobjTimelineSignal(dev->core->fd, syncobjs,
                                        points, syncobj_count);
 }
 
@@ -694,7 +696,7 @@ drm_public int amdgpu_cs_syncobj_wait(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjWait(dev->fd, handles, num_handles, timeout_nsec,
+       return drmSyncobjWait(dev->core->fd, handles, num_handles, timeout_nsec,
                              flags, first_signaled);
 }
 
@@ -707,7 +709,7 @@ drm_public int amdgpu_cs_syncobj_timeline_wait(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjTimelineWait(dev->fd, handles, points, num_handles,
+       return drmSyncobjTimelineWait(dev->core->fd, handles, points, num_handles,
                                      timeout_nsec, flags, first_signaled);
 }
 
@@ -718,7 +720,7 @@ drm_public int amdgpu_cs_syncobj_query(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjQuery(dev->fd, handles, points, num_handles);
+       return drmSyncobjQuery(dev->core->fd, handles, points, num_handles);
 }
 
 drm_public int amdgpu_cs_export_syncobj(amdgpu_device_handle dev,
@@ -728,7 +730,7 @@ drm_public int amdgpu_cs_export_syncobj(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjHandleToFD(dev->fd, handle, shared_fd);
+       return drmSyncobjHandleToFD(dev->core->fd, handle, shared_fd);
 }
 
 drm_public int amdgpu_cs_import_syncobj(amdgpu_device_handle dev,
@@ -738,7 +740,7 @@ drm_public int amdgpu_cs_import_syncobj(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjFDToHandle(dev->fd, shared_fd, handle);
+       return drmSyncobjFDToHandle(dev->core->fd, shared_fd, handle);
 }
 
 drm_public int amdgpu_cs_syncobj_export_sync_file(amdgpu_device_handle dev,
@@ -748,7 +750,7 @@ drm_public int amdgpu_cs_syncobj_export_sync_file(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjExportSyncFile(dev->fd, syncobj, sync_file_fd);
+       return drmSyncobjExportSyncFile(dev->core->fd, syncobj, sync_file_fd);
 }
 
 drm_public int amdgpu_cs_syncobj_import_sync_file(amdgpu_device_handle dev,
@@ -758,21 +760,24 @@ drm_public int amdgpu_cs_syncobj_import_sync_file(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjImportSyncFile(dev->fd, syncobj, sync_file_fd);
+       return drmSyncobjImportSyncFile(dev->core->fd, syncobj, sync_file_fd);
 }
 
-drm_public int amdgpu_cs_syncobj_export_sync_file2(amdgpu_device_handle dev,
+drm_public int amdgpu_cs_syncobj_export_sync_file2(amdgpu_device_handle user_dev,
                                                   uint32_t syncobj,
                                                   uint64_t point,
                                                   uint32_t flags,
                                                   int *sync_file_fd)
 {
+       struct amdgpu_core_device *dev;
        uint32_t binary_handle;
        int ret;
 
-       if (NULL == dev)
+       if (!user_dev)
                return -EINVAL;
 
+       dev = user_dev->core;
+
        if (!point)
                return drmSyncobjExportSyncFile(dev->fd, syncobj, sync_file_fd);
 
@@ -790,17 +795,20 @@ out:
        return ret;
 }
 
-drm_public int amdgpu_cs_syncobj_import_sync_file2(amdgpu_device_handle dev,
+drm_public int amdgpu_cs_syncobj_import_sync_file2(amdgpu_device_handle user_dev,
                                                   uint32_t syncobj,
                                                   uint64_t point,
                                                   int sync_file_fd)
 {
+       struct amdgpu_core_device *dev;
        uint32_t binary_handle;
        int ret;
 
-       if (NULL == dev)
+       if (!user_dev)
                return -EINVAL;
 
+       dev = user_dev->core;
+
        if (!point)
                return drmSyncobjImportSyncFile(dev->fd, syncobj, sync_file_fd);
 
@@ -827,7 +835,7 @@ drm_public int amdgpu_cs_syncobj_transfer(amdgpu_device_handle dev,
        if (NULL == dev)
                return -EINVAL;
 
-       return drmSyncobjTransfer(dev->fd,
+       return drmSyncobjTransfer(dev->core->fd,
                                  dst_handle, dst_point,
                                  src_handle, src_point,
                                  flags);
@@ -854,7 +862,7 @@ drm_public int amdgpu_cs_submit_raw(amdgpu_device_handle dev,
        cs.in.ctx_id = context->id;
        cs.in.bo_list_handle = bo_list_handle ? bo_list_handle->handle : 0;
        cs.in.num_chunks = num_chunks;
-       r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_CS,
+       r = drmCommandWriteRead(dev->core->fd, DRM_AMDGPU_CS,
                                &cs, sizeof(cs));
        if (r)
                return r;
@@ -883,7 +891,7 @@ drm_public int amdgpu_cs_submit_raw2(amdgpu_device_handle dev,
        cs.in.ctx_id = context->id;
        cs.in.bo_list_handle = bo_list_handle;
        cs.in.num_chunks = num_chunks;
-       r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_CS,
+       r = drmCommandWriteRead(dev->core->fd, DRM_AMDGPU_CS,
                                &cs, sizeof(cs));
        if (!r && seq_no)
                *seq_no = cs.out.handle;
@@ -893,7 +901,7 @@ drm_public int amdgpu_cs_submit_raw2(amdgpu_device_handle dev,
 drm_public void amdgpu_cs_chunk_fence_info_to_data(struct amdgpu_cs_fence_info *fence_info,
                                        struct drm_amdgpu_cs_chunk_data *data)
 {
-       data->fence_data.handle = fence_info->handle->handle;
+       data->fence_data.handle = fence_info->handle->core->handle;
        data->fence_data.offset = fence_info->offset * sizeof(uint64_t);
 }
 
@@ -923,7 +931,7 @@ drm_public int amdgpu_cs_fence_to_handle(amdgpu_device_handle dev,
        fth.in.fence.seq_no = fence->fence;
        fth.in.what = what;
 
-       r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_FENCE_TO_HANDLE,
+       r = drmCommandWriteRead(dev->core->fd, DRM_AMDGPU_FENCE_TO_HANDLE,
                                &fth, sizeof(fth));
        if (r == 0)
                *out_handle = fth.out.handle;
diff --git a/amdgpu/amdgpu_device.c b/amdgpu/amdgpu_device.c
index 76b4e5eb..abf5f942 100644
--- a/amdgpu/amdgpu_device.c
+++ b/amdgpu/amdgpu_device.c
@@ -44,7 +44,7 @@
 #define PTR_TO_UINT(x) ((unsigned)((intptr_t)(x)))
 
 static pthread_mutex_t dev_mutex = PTHREAD_MUTEX_INITIALIZER;
-static amdgpu_device_handle dev_list;
+static struct amdgpu_core_device *dev_list;
 
 static int fd_compare(int fd1, int fd2)
 {
@@ -65,47 +65,15 @@ static int fd_compare(int fd1, int fd2)
        return result;
 }
 
-/**
-* Get the authenticated form fd,
-*
-* \param   fd   - \c [in]  File descriptor for AMD GPU device
-* \param   auth - \c [out] Pointer to output the fd is authenticated or not
-*                          A render node fd, output auth = 0
-*                          A legacy fd, get the authenticated for compatibility root
-*
-* \return   0 on success\n
-*          >0 - AMD specific error code\n
-*          <0 - Negative POSIX Error code
-*/
-static int amdgpu_get_auth(int fd, int *auth)
+static void amdgpu_device_free(struct amdgpu_core_device *dev)
 {
-       int r = 0;
-       drm_client_t client = {};
-
-       if (drmGetNodeTypeFromFd(fd) == DRM_NODE_RENDER)
-               *auth = 0;
-       else {
-               client.idx = 0;
-               r = drmIoctl(fd, DRM_IOCTL_GET_CLIENT, &client);
-               if (!r)
-                       *auth = client.auth;
-       }
-       return r;
-}
+       struct amdgpu_core_device **node = &dev_list;
 
-static void amdgpu_device_free_internal(amdgpu_device_handle dev)
-{
-       amdgpu_device_handle *node = &dev_list;
-
-       pthread_mutex_lock(&dev_mutex);
        while (*node != dev && (*node)->next)
                node = &(*node)->next;
        *node = (*node)->next;
-       pthread_mutex_unlock(&dev_mutex);
 
        close(dev->fd);
-       if ((dev->flink_fd >= 0) && (dev->fd != dev->flink_fd))
-               close(dev->flink_fd);
 
        amdgpu_vamgr_deinit(&dev->vamgr_32);
        amdgpu_vamgr_deinit(&dev->vamgr);
@@ -118,87 +86,39 @@ static void amdgpu_device_free_internal(amdgpu_device_handle dev)
        free(dev);
 }
 
-/**
- * Assignment between two amdgpu_device pointers with reference counting.
- *
- * Usage:
- *    struct amdgpu_device *dst = ... , *src = ...;
- *
- *    dst = src;
- *    // No reference counting. Only use this when you need to move
- *    // a reference from one pointer to another.
- *
- *    amdgpu_device_reference(&dst, src);
- *    // Reference counters are updated. dst is decremented and src is
- *    // incremented. dst is freed if its reference counter is 0.
- */
-static void amdgpu_device_reference(struct amdgpu_device **dst,
-                                   struct amdgpu_device *src)
+static int amdgpu_device_init(amdgpu_device_handle user_dev)
 {
-       if (update_references(&(*dst)->refcount, &src->refcount))
-               amdgpu_device_free_internal(*dst);
-       *dst = src;
-}
-
-drm_public int amdgpu_device_initialize(int fd,
-                                       uint32_t *major_version,
-                                       uint32_t *minor_version,
-                                       amdgpu_device_handle *device_handle)
-{
-       struct amdgpu_device *dev;
+       struct amdgpu_core_device *dev;
        drmVersionPtr version;
-       int r;
-       int flag_auth = 0;
-       int flag_authexist=0;
-       uint32_t accel_working = 0;
        uint64_t start, max;
-
-       *device_handle = NULL;
-
-       pthread_mutex_lock(&dev_mutex);
-       r = amdgpu_get_auth(fd, &flag_auth);
-       if (r) {
-               fprintf(stderr, "%s: amdgpu_get_auth (1) failed (%i)\n",
-                       __func__, r);
-               pthread_mutex_unlock(&dev_mutex);
-               return r;
-       }
+       int r;
 
        for (dev = dev_list; dev; dev = dev->next)
-               if (fd_compare(dev->fd, fd) == 0)
+               if (fd_compare(dev->fd, user_dev->user_fd) == 0)
                        break;
 
        if (dev) {
-               r = amdgpu_get_auth(dev->fd, &flag_authexist);
-               if (r) {
-                       fprintf(stderr, "%s: amdgpu_get_auth (2) failed (%i)\n",
-                               __func__, r);
-                       pthread_mutex_unlock(&dev_mutex);
-                       return r;
-               }
-               if ((flag_auth) && (!flag_authexist)) {
-                       dev->flink_fd = fcntl(fd, F_DUPFD_CLOEXEC, 0);
-               }
-               *major_version = dev->major_version;
-               *minor_version = dev->minor_version;
-               amdgpu_device_reference(device_handle, dev);
-               pthread_mutex_unlock(&dev_mutex);
+               atomic_inc(&dev->refcount);
+               user_dev->core = dev;
                return 0;
        }
 
-       dev = calloc(1, sizeof(struct amdgpu_device));
+       dev = calloc(1, sizeof(struct amdgpu_core_device));
        if (!dev) {
                fprintf(stderr, "%s: calloc failed\n", __func__);
-               pthread_mutex_unlock(&dev_mutex);
                return -ENOMEM;
        }
 
-       dev->fd = -1;
-       dev->flink_fd = -1;
-
        atomic_set(&dev->refcount, 1);
+       pthread_mutex_init(&dev->bo_table_mutex, NULL);
+
+       dev->fd = user_dev->user_fd;
+       user_dev->core = dev;
+
+       dev->next = dev_list;
+       dev_list = dev;
 
-       version = drmGetVersion(fd);
+       version = drmGetVersion(dev->fd);
        if (version->version_major != 3) {
                fprintf(stderr, "%s: DRM version is %d.%d.%d but this driver is "
                        "only compatible with 3.x.x.\n",
@@ -211,28 +131,11 @@ drm_public int amdgpu_device_initialize(int fd,
                goto cleanup;
        }
 
-       dev->fd = fcntl(fd, F_DUPFD_CLOEXEC, 0);
-       dev->flink_fd = dev->fd;
        dev->major_version = version->version_major;
        dev->minor_version = version->version_minor;
        drmFreeVersion(version);
 
-       pthread_mutex_init(&dev->bo_table_mutex, NULL);
-
-       /* Check if acceleration is working. */
-       r = amdgpu_query_info(dev, AMDGPU_INFO_ACCEL_WORKING, 4, &accel_working);
-       if (r) {
-               fprintf(stderr, "%s: amdgpu_query_info(ACCEL_WORKING) failed (%i)\n",
-                       __func__, r);
-               goto cleanup;
-       }
-       if (!accel_working) {
-               fprintf(stderr, "%s: AMDGPU_INFO_ACCEL_WORKING = 0\n", __func__);
-               r = -EBADF;
-               goto cleanup;
-       }
-
-       r = amdgpu_query_gpu_info_init(dev);
+       r = amdgpu_query_gpu_info_init(user_dev);
        if (r) {
                fprintf(stderr, "%s: amdgpu_query_gpu_info_init failed\n", __func__);
                goto cleanup;
@@ -261,39 +164,97 @@ drm_public int amdgpu_device_initialize(int fd,
                          dev->dev_info.virtual_address_alignment);
 
        amdgpu_parse_asic_ids(dev);
+       return 0;
 
-       *major_version = dev->major_version;
-       *minor_version = dev->minor_version;
-       *device_handle = dev;
-       dev->next = dev_list;
-       dev_list = dev;
+cleanup:
+       user_dev->core = NULL;
+       close(dev->fd);
+       free(dev);
+       return r;
+}
+
+drm_public int amdgpu_device_initialize(int fd,
+                                       uint32_t *major_version,
+                                       uint32_t *minor_version,
+                                       amdgpu_device_handle *device_handle)
+{
+       struct amdgpu_device *user_dev;
+       uint32_t accel_working = 0;
+       int r;
+
+       *device_handle = NULL;
+
+       user_dev = calloc(1, sizeof(struct amdgpu_device));
+       if (!user_dev) {
+               fprintf(stderr, "%s: calloc failed\n", __func__);
+               return -ENOMEM;
+       }
+
+       user_dev->user_fd = fcntl(fd, F_DUPFD_CLOEXEC, 0);
+
+       pthread_mutex_lock(&dev_mutex);
+
+       r = amdgpu_device_init(user_dev);
+       if (r != 0)
+               goto cleanup;
+
+       /* Check if acceleration is working. */
+       r = amdgpu_query_info(user_dev, AMDGPU_INFO_ACCEL_WORKING, 4, &accel_working);
+       if (r) {
+               fprintf(stderr, "%s: amdgpu_query_info(ACCEL_WORKING) failed (%i)\n",
+                       __func__, r);
+               goto cleanup;
+       }
+       if (!accel_working) {
+               fprintf(stderr, "%s: AMDGPU_INFO_ACCEL_WORKING = 0\n", __func__);
+               r = -EBADF;
+               goto cleanup;
+       }
+
+       *major_version = user_dev->core->major_version;
+       *minor_version = user_dev->core->minor_version;
+       *device_handle = user_dev;
        pthread_mutex_unlock(&dev_mutex);
 
        return 0;
 
 cleanup:
-       if (dev->fd >= 0)
-               close(dev->fd);
-       free(dev);
+       if (!user_dev->core || user_dev->user_fd != user_dev->core->fd)
+               close(user_dev->user_fd);
+       if (user_dev->core && update_references(&user_dev->core->refcount, NULL))
+               amdgpu_device_free(user_dev->core);
+       free(user_dev);
        pthread_mutex_unlock(&dev_mutex);
        return r;
 }
 
-drm_public int amdgpu_device_deinitialize(amdgpu_device_handle dev)
+drm_public int amdgpu_device_deinitialize(amdgpu_device_handle user_dev)
 {
-       amdgpu_device_reference(&dev, NULL);
+       struct amdgpu_core_device *dev = user_dev->core;
+
+       pthread_mutex_lock(&dev_mutex);
+
+       if (user_dev->user_fd != dev->fd)
+               close(user_dev->user_fd);
+
+       if (update_references(&dev->refcount, NULL))
+               amdgpu_device_free(dev);
+
+       pthread_mutex_unlock(&dev_mutex);
+       free(user_dev);
        return 0;
 }
 
-drm_public const char *amdgpu_get_marketing_name(amdgpu_device_handle dev)
+drm_public const char *amdgpu_get_marketing_name(amdgpu_device_handle user_dev)
 {
-       return dev->marketing_name;
+       return user_dev->core->marketing_name;
 }
 
-drm_public int amdgpu_query_sw_info(amdgpu_device_handle dev,
+drm_public int amdgpu_query_sw_info(amdgpu_device_handle user_dev,
                                    enum amdgpu_sw_info info,
                                    void *value)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
        uint32_t *val32 = (uint32_t*)value;
 
        switch (info) {
diff --git a/amdgpu/amdgpu_gpu_info.c b/amdgpu/amdgpu_gpu_info.c
index 777087f2..7253fbea 100644
--- a/amdgpu/amdgpu_gpu_info.c
+++ b/amdgpu/amdgpu_gpu_info.c
@@ -40,7 +40,7 @@ drm_public int amdgpu_query_info(amdgpu_device_handle dev, unsigned info_id,
        request.return_size = size;
        request.query = info_id;
 
-       return drmCommandWrite(dev->fd, DRM_AMDGPU_INFO, &request,
+       return drmCommandWrite(dev->core->fd, DRM_AMDGPU_INFO, &request,
                               sizeof(struct drm_amdgpu_info));
 }
 
@@ -55,7 +55,7 @@ drm_public int amdgpu_query_crtc_from_id(amdgpu_device_handle dev, unsigned id,
        request.query = AMDGPU_INFO_CRTC_FROM_ID;
        request.mode_crtc.id = id;
 
-       return drmCommandWrite(dev->fd, DRM_AMDGPU_INFO, &request,
+       return drmCommandWrite(dev->core->fd, DRM_AMDGPU_INFO, &request,
                               sizeof(struct drm_amdgpu_info));
 }
 
@@ -74,7 +74,7 @@ drm_public int amdgpu_read_mm_registers(amdgpu_device_handle dev,
        request.read_mmr_reg.instance = instance;
        request.read_mmr_reg.flags = flags;
 
-       return drmCommandWrite(dev->fd, DRM_AMDGPU_INFO, &request,
+       return drmCommandWrite(dev->core->fd, DRM_AMDGPU_INFO, &request,
                               sizeof(struct drm_amdgpu_info));
 }
 
@@ -90,7 +90,7 @@ drm_public int amdgpu_query_hw_ip_count(amdgpu_device_handle dev,
        request.query = AMDGPU_INFO_HW_IP_COUNT;
        request.query_hw_ip.type = type;
 
-       return drmCommandWrite(dev->fd, DRM_AMDGPU_INFO, &request,
+       return drmCommandWrite(dev->core->fd, DRM_AMDGPU_INFO, &request,
                               sizeof(struct drm_amdgpu_info));
 }
 
@@ -107,7 +107,7 @@ drm_public int amdgpu_query_hw_ip_info(amdgpu_device_handle dev, unsigned type,
        request.query_hw_ip.type = type;
        request.query_hw_ip.ip_instance = ip_instance;
 
-       return drmCommandWrite(dev->fd, DRM_AMDGPU_INFO, &request,
+       return drmCommandWrite(dev->core->fd, DRM_AMDGPU_INFO, &request,
                               sizeof(struct drm_amdgpu_info));
 }
 
@@ -127,7 +127,7 @@ drm_public int amdgpu_query_firmware_version(amdgpu_device_handle dev,
        request.query_fw.ip_instance = ip_instance;
        request.query_fw.index = index;
 
-       r = drmCommandWrite(dev->fd, DRM_AMDGPU_INFO, &request,
+       r = drmCommandWrite(dev->core->fd, DRM_AMDGPU_INFO, &request,
                            sizeof(struct drm_amdgpu_info));
        if (r)
                return r;
@@ -137,11 +137,12 @@ drm_public int amdgpu_query_firmware_version(amdgpu_device_handle dev,
        return 0;
 }
 
-drm_private int amdgpu_query_gpu_info_init(amdgpu_device_handle dev)
+drm_private int amdgpu_query_gpu_info_init(amdgpu_device_handle user_dev)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
        int r, i;
 
-       r = amdgpu_query_info(dev, AMDGPU_INFO_DEV_INFO, sizeof(dev->dev_info),
+       r = amdgpu_query_info(user_dev, AMDGPU_INFO_DEV_INFO, sizeof(dev->dev_info),
                              &dev->dev_info);
        if (r)
                return r;
@@ -172,7 +173,7 @@ drm_private int amdgpu_query_gpu_info_init(amdgpu_device_handle dev)
                                            (AMDGPU_INFO_MMR_SH_INDEX_MASK <<
                                             AMDGPU_INFO_MMR_SH_INDEX_SHIFT);
 
-                       r = amdgpu_read_mm_registers(dev, 0x263d, 1, instance, 0,
+                       r = amdgpu_read_mm_registers(user_dev, 0x263d, 1, instance, 0,
                                                     &dev->info.backend_disable[i]);
                        if (r)
                                return r;
@@ -180,13 +181,13 @@ drm_private int amdgpu_query_gpu_info_init(amdgpu_device_handle dev)
                        dev->info.backend_disable[i] =
                                (dev->info.backend_disable[i] >> 16) & 0xff;
 
-                       r = amdgpu_read_mm_registers(dev, 0xa0d4, 1, instance, 0,
+                       r = amdgpu_read_mm_registers(user_dev, 0xa0d4, 1, instance, 0,
                                                     &dev->info.pa_sc_raster_cfg[i]);
                        if (r)
                                return r;
 
                        if (dev->info.family_id >= AMDGPU_FAMILY_CI) {
-                               r = amdgpu_read_mm_registers(dev, 0xa0d5, 1, instance, 0,
+                               r = amdgpu_read_mm_registers(user_dev, 0xa0d5, 1, instance, 0,
                                                     &dev->info.pa_sc_raster_cfg1[i]);
                                if (r)
                                        return r;
@@ -194,25 +195,25 @@ drm_private int amdgpu_query_gpu_info_init(amdgpu_device_handle dev)
                }
        }
 
-       r = amdgpu_read_mm_registers(dev, 0x263e, 1, 0xffffffff, 0,
+       r = amdgpu_read_mm_registers(user_dev, 0x263e, 1, 0xffffffff, 0,
                                             &dev->info.gb_addr_cfg);
        if (r)
                return r;
 
        if (dev->info.family_id < AMDGPU_FAMILY_AI) {
-               r = amdgpu_read_mm_registers(dev, 0x2644, 32, 0xffffffff, 0,
+               r = amdgpu_read_mm_registers(user_dev, 0x2644, 32, 0xffffffff, 0,
                                             dev->info.gb_tile_mode);
                if (r)
                        return r;
 
                if (dev->info.family_id >= AMDGPU_FAMILY_CI) {
-                       r = amdgpu_read_mm_registers(dev, 0x2664, 16, 0xffffffff, 0,
+                       r = amdgpu_read_mm_registers(user_dev, 0x2664, 16, 0xffffffff, 0,
                                                     dev->info.gb_macro_tile_mode);
                        if (r)
                                return r;
                }
 
-               r = amdgpu_read_mm_registers(dev, 0x9d8, 1, 0xffffffff, 0,
+               r = amdgpu_read_mm_registers(user_dev, 0x9d8, 1, 0xffffffff, 0,
                                             &dev->info.mc_arb_ramcfg);
                if (r)
                        return r;
@@ -235,7 +236,7 @@ drm_public int amdgpu_query_gpu_info(amdgpu_device_handle dev,
                return -EINVAL;
 
        /* Get ASIC info*/
-       *info = dev->info;
+       *info = dev->core->info;
 
        return 0;
 }
@@ -328,6 +329,6 @@ drm_public int amdgpu_query_sensor_info(amdgpu_device_handle dev, unsigned senso
        request.query = AMDGPU_INFO_SENSOR;
        request.sensor_info.type = sensor_type;
 
-       return drmCommandWrite(dev->fd, DRM_AMDGPU_INFO, &request,
+       return drmCommandWrite(dev->core->fd, DRM_AMDGPU_INFO, &request,
                               sizeof(struct drm_amdgpu_info));
 }
diff --git a/amdgpu/amdgpu_internal.h b/amdgpu/amdgpu_internal.h
index a340abbd..3a2ab74c 100644
--- a/amdgpu/amdgpu_internal.h
+++ b/amdgpu/amdgpu_internal.h
@@ -64,14 +64,13 @@ struct amdgpu_va {
        struct amdgpu_bo_va_mgr *vamgr;
 };
 
-struct amdgpu_device {
+struct amdgpu_core_device {
        atomic_t refcount;
-       struct amdgpu_device *next;
        int fd;
-       int flink_fd;
        unsigned major_version;
        unsigned minor_version;
 
+       struct amdgpu_core_device *next;
        char *marketing_name;
        /** List of buffer handles. Protected by bo_table_mutex. */
        struct handle_table bo_handles;
@@ -91,9 +90,14 @@ struct amdgpu_device {
        struct amdgpu_bo_va_mgr vamgr_high_32;
 };
 
-struct amdgpu_bo {
+struct amdgpu_device {
+       int user_fd;
+       struct amdgpu_core_device *core;
+};
+
+struct amdgpu_core_bo {
        atomic_t refcount;
-       struct amdgpu_device *dev;
+       amdgpu_bo_handle user_bos;
 
        uint64_t alloc_size;
 
@@ -105,14 +109,21 @@ struct amdgpu_bo {
        int cpu_map_count;
 };
 
-struct amdgpu_bo_list {
+struct amdgpu_bo {
+       atomic_t refcount;
+       struct amdgpu_bo *next;
+       struct amdgpu_core_bo *core;
        struct amdgpu_device *dev;
+};
+
+struct amdgpu_bo_list {
+       struct amdgpu_core_device *dev;
 
        uint32_t handle;
 };
 
 struct amdgpu_context {
-       struct amdgpu_device *dev;
+       struct amdgpu_core_device *dev;
        /** Mutex for accessing fences and to maintain command submissions
            in good sequence. */
        pthread_mutex_t sequence_mutex;
@@ -141,7 +152,7 @@ drm_private void amdgpu_vamgr_init(struct amdgpu_bo_va_mgr *mgr, uint64_t start,
 
 drm_private void amdgpu_vamgr_deinit(struct amdgpu_bo_va_mgr *mgr);
 
-drm_private void amdgpu_parse_asic_ids(struct amdgpu_device *dev);
+drm_private void amdgpu_parse_asic_ids(struct amdgpu_core_device *dev);
 
 drm_private int amdgpu_query_gpu_info_init(amdgpu_device_handle dev);
 
diff --git a/amdgpu/amdgpu_vamgr.c b/amdgpu/amdgpu_vamgr.c
index d25d4216..560b84e7 100644
--- a/amdgpu/amdgpu_vamgr.c
+++ b/amdgpu/amdgpu_vamgr.c
@@ -29,10 +29,12 @@
 #include "amdgpu_internal.h"
 #include "util_math.h"
 
-drm_public int amdgpu_va_range_query(amdgpu_device_handle dev,
+drm_public int amdgpu_va_range_query(amdgpu_device_handle user_dev,
                                     enum amdgpu_gpu_va_range type,
                                     uint64_t *start, uint64_t *end)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
+
        if (type != amdgpu_gpu_va_range_general)
                return -EINVAL;
 
@@ -186,7 +188,7 @@ out:
        pthread_mutex_unlock(&mgr->bo_va_mutex);
 }
 
-drm_public int amdgpu_va_range_alloc(amdgpu_device_handle dev,
+drm_public int amdgpu_va_range_alloc(amdgpu_device_handle user_dev,
                                     enum amdgpu_gpu_va_range va_range_type,
                                     uint64_t size,
                                     uint64_t va_base_alignment,
@@ -195,6 +197,7 @@ drm_public int amdgpu_va_range_alloc(amdgpu_device_handle dev,
                                     amdgpu_va_handle *va_range_handle,
                                     uint64_t flags)
 {
+       struct amdgpu_core_device *dev = user_dev->core;
        struct amdgpu_bo_va_mgr *vamgr;
 
        /* Clear the flag when the high VA manager is not initialized */
@@ -237,7 +240,7 @@ drm_public int amdgpu_va_range_alloc(amdgpu_device_handle dev,
                        amdgpu_vamgr_free_va(vamgr, *va_base_allocated, size);
                        return -ENOMEM;
                }
-               va->dev = dev;
+               va->dev = user_dev;
                va->address = *va_base_allocated;
                va->size = size;
                va->range = va_range_type;
diff --git a/amdgpu/amdgpu_vm.c b/amdgpu/amdgpu_vm.c
index 7e6e28f0..de44e6c2 100644
--- a/amdgpu/amdgpu_vm.c
+++ b/amdgpu/amdgpu_vm.c
@@ -33,7 +33,7 @@ drm_public int amdgpu_vm_reserve_vmid(amdgpu_device_handle dev, uint32_t flags)
        vm.in.op = AMDGPU_VM_OP_RESERVE_VMID;
        vm.in.flags = flags;
 
-       return drmCommandWriteRead(dev->fd, DRM_AMDGPU_VM,
+       return drmCommandWriteRead(dev->core->fd, DRM_AMDGPU_VM,
                                   &vm, sizeof(vm));
 }
 
@@ -45,6 +45,6 @@ drm_public int amdgpu_vm_unreserve_vmid(amdgpu_device_handle dev,
        vm.in.op = AMDGPU_VM_OP_UNRESERVE_VMID;
        vm.in.flags = flags;
 
-       return drmCommandWriteRead(dev->fd, DRM_AMDGPU_VM,
+       return drmCommandWriteRead(dev->core->fd, DRM_AMDGPU_VM,
                                   &vm, sizeof(vm));
 }
diff --git a/tests/amdgpu/amdgpu_test.c b/tests/amdgpu/amdgpu_test.c
index 73403fb4..7095c4e4 100644
--- a/tests/amdgpu/amdgpu_test.c
+++ b/tests/amdgpu/amdgpu_test.c
@@ -428,7 +428,7 @@ static void amdgpu_disable_suites()
                                   &minor_version, &device_handle))
                return;
 
-       family_id = device_handle->info.family_id;
+       family_id = device_handle->core->info.family_id;
 
        if (amdgpu_device_deinitialize(device_handle))
                return;
diff --git a/tests/amdgpu/bo_tests.c b/tests/amdgpu/bo_tests.c
index 7cff4cf7..d89c944d 100644
--- a/tests/amdgpu/bo_tests.c
+++ b/tests/amdgpu/bo_tests.c
@@ -309,7 +309,7 @@ static void amdgpu_bo_find_by_cpu_mapping(void)
                                          &offset);
        CU_ASSERT_EQUAL(r, 0);
        CU_ASSERT_EQUAL(offset, 0);
-       CU_ASSERT_EQUAL(bo_handle->handle, find_bo_handle->handle);
+       CU_ASSERT_EQUAL(bo_handle->core->handle, find_bo_handle->core->handle);
 
        atomic_dec(&find_bo_handle->refcount, 1);
        r = amdgpu_bo_unmap_and_free(bo_handle, va_handle,
diff --git a/tests/amdgpu/cs_tests.c b/tests/amdgpu/cs_tests.c
index 7ad0f0dc..8a5f6ed3 100644
--- a/tests/amdgpu/cs_tests.c
+++ b/tests/amdgpu/cs_tests.c
@@ -68,7 +68,7 @@ CU_BOOL suite_cs_tests_enable(void)
                                             &minor_version, &device_handle))
                return CU_FALSE;
 
-       family_id = device_handle->info.family_id;
+       family_id = device_handle->core->info.family_id;
 
        if (amdgpu_device_deinitialize(device_handle))
                return CU_FALSE;
@@ -101,10 +101,10 @@ int suite_cs_tests_init(void)
                return CUE_SINIT_FAILED;
        }
 
-       family_id = device_handle->info.family_id;
+       family_id = device_handle->core->info.family_id;
        /* VI asic POLARIS10/11 have specific external_rev_id */
-       chip_rev = device_handle->info.chip_rev;
-       chip_id = device_handle->info.chip_external_rev;
+       chip_rev = device_handle->core->info.chip_rev;
+       chip_id = device_handle->core->info.chip_external_rev;
 
        r = amdgpu_cs_ctx_create(device_handle, &context_handle);
        if (r)
diff --git a/tests/amdgpu/deadlock_tests.c b/tests/amdgpu/deadlock_tests.c
index 91368c15..8526bae7 100644
--- a/tests/amdgpu/deadlock_tests.c
+++ b/tests/amdgpu/deadlock_tests.c
@@ -127,14 +127,14 @@ CU_BOOL suite_deadlock_tests_enable(void)
         * Only enable for ASICs supporting GPU reset and for which it's enabled
         * by default (currently GFX8/9 dGPUS)
         */
-       if (device_handle->info.family_id != AMDGPU_FAMILY_VI &&
-           device_handle->info.family_id != AMDGPU_FAMILY_AI &&
-           device_handle->info.family_id != AMDGPU_FAMILY_CI) {
+       if (device_handle->core->info.family_id != AMDGPU_FAMILY_VI &&
+           device_handle->core->info.family_id != AMDGPU_FAMILY_AI &&
+           device_handle->core->info.family_id != AMDGPU_FAMILY_CI) {
                printf("\n\nGPU reset is not enabled for the ASIC, deadlock suite disabled\n");
                enable = CU_FALSE;
        }
 
-       if (device_handle->info.family_id >= AMDGPU_FAMILY_AI)
+       if (device_handle->core->info.family_id >= AMDGPU_FAMILY_AI)
                use_uc_mtype = 1;
 
        if (amdgpu_device_deinitialize(device_handle))
diff --git a/tests/amdgpu/uvd_enc_tests.c b/tests/amdgpu/uvd_enc_tests.c
index b4251bcf..856e7ae1 100644
--- a/tests/amdgpu/uvd_enc_tests.c
+++ b/tests/amdgpu/uvd_enc_tests.c
@@ -114,7 +114,7 @@ int suite_uvd_enc_tests_init(void)
        if (r)
                return CUE_SINIT_FAILED;
 
-       family_id = device_handle->info.family_id;
+       family_id = device_handle->core->info.family_id;
 
        r = amdgpu_cs_ctx_create(device_handle, &context_handle);
        if (r)
diff --git a/tests/amdgpu/vce_tests.c b/tests/amdgpu/vce_tests.c
index 0026826e..05d9ef57 100644
--- a/tests/amdgpu/vce_tests.c
+++ b/tests/amdgpu/vce_tests.c
@@ -103,10 +103,10 @@ CU_BOOL suite_vce_tests_enable(void)
                                             &minor_version, &device_handle))
                return CU_FALSE;
 
-       family_id = device_handle->info.family_id;
-       chip_rev = device_handle->info.chip_rev;
-       chip_id = device_handle->info.chip_external_rev;
-       ids_flags = device_handle->info.ids_flags;
+       family_id = device_handle->core->info.family_id;
+       chip_rev = device_handle->core->info.chip_rev;
+       chip_id = device_handle->core->info.chip_external_rev;
+       ids_flags = device_handle->core->info.ids_flags;
 
        amdgpu_query_firmware_version(device_handle, AMDGPU_INFO_FW_VCE, 0,
                                          0, &version, &feature);
@@ -153,8 +153,8 @@ int suite_vce_tests_init(void)
                return CUE_SINIT_FAILED;
        }
 
-       family_id = device_handle->info.family_id;
-       vce_harvest_config = device_handle->info.vce_harvest_config;
+       family_id = device_handle->core->info.family_id;
+       vce_harvest_config = device_handle->core->info.vce_harvest_config;
 
        r = amdgpu_cs_ctx_create(device_handle, &context_handle);
        if (r)
diff --git a/tests/amdgpu/vcn_tests.c b/tests/amdgpu/vcn_tests.c
index ad438f35..17248444 100644
--- a/tests/amdgpu/vcn_tests.c
+++ b/tests/amdgpu/vcn_tests.c
@@ -94,7 +94,7 @@ CU_BOOL suite_vcn_tests_enable(void)
                                   &minor_version, &device_handle))
                return CU_FALSE;
 
-       family_id = device_handle->info.family_id;
+       family_id = device_handle->core->info.family_id;
 
        if (amdgpu_device_deinitialize(device_handle))
                        return CU_FALSE;
@@ -132,7 +132,7 @@ int suite_vcn_tests_init(void)
        if (r)
                return CUE_SINIT_FAILED;
 
-       family_id = device_handle->info.family_id;
+       family_id = device_handle->core->info.family_id;
 
        r = amdgpu_cs_ctx_create(device_handle, &context_handle);
        if (r)
diff --git a/tests/amdgpu/vm_tests.c b/tests/amdgpu/vm_tests.c
index 69bc4683..e52aef25 100644
--- a/tests/amdgpu/vm_tests.c
+++ b/tests/amdgpu/vm_tests.c
@@ -43,7 +43,7 @@ CU_BOOL suite_vm_tests_enable(void)
                                     &minor_version, &device_handle))
                return CU_FALSE;
 
-       if (device_handle->info.family_id == AMDGPU_FAMILY_SI) {
+       if (device_handle->core->info.family_id == AMDGPU_FAMILY_SI) {
                printf("\n\nCurrently hangs the CP on this ASIC, VM suite disabled\n");
                enable = CU_FALSE;
        }
-- 
2.20.1

_______________________________________________
dri-devel mailing list
dri-devel@lists.freedesktop.org
https://lists.freedesktop.org/mailman/listinfo/dri-devel

[PATCH libdrm 4/9] amdgpu: Add struct amdgpu_core_device and amdgpu_core_bo

Reply via email to