diff options
author | Evgeny Pinchuk <evgeny.pinchuk@amd.com> | 2014-04-17 15:36:58 +0300 |
---|---|---|
committer | Oded Gabbay <oded.gabbay@amd.com> | 2014-05-04 10:37:15 +0300 |
commit | a4286d57ebc0880331884cb5073eca66a4908698 (patch) | |
tree | 6facf346df73d89b2a8685011ab3d0c21a61bfe9 | |
parent | 6c4e691c342dfbad553a89dc246037ef3dce3b12 (diff) |
hsa/radeon: Exclusive access for perf. counters
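Introduce two IOCTLs, KFD_IOC_PMC_ACQUIRE_ACCESS and
KFD_IOC_PMC_RELEASE_ACCESS, for controlling exclusive access to
performance counters.
The exclusive access is per GPU device and is held by a (process, trace ID)
pair; it is also dropped when the holding process is freed.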
Signed-off-by: Evgeny Pinchuk <evgeny.pinchuk@amd.com>
Signed-off-by: Oded Gabbay <oded.gabbay@amd.com>
-rw-r--r-- | drivers/gpu/hsa/radeon/kfd_chardev.c | 61 | ||||
-rw-r--r-- | drivers/gpu/hsa/radeon/kfd_device.c | 2 | ||||
-rw-r--r-- | drivers/gpu/hsa/radeon/kfd_priv.h | 5 | ||||
-rw-r--r-- | drivers/gpu/hsa/radeon/kfd_process.c | 9 | ||||
-rw-r--r-- | include/uapi/linux/kfd_ioctl.h | 12 |
5 files changed, 88 insertions, 1 deletions
diff --git a/drivers/gpu/hsa/radeon/kfd_chardev.c b/drivers/gpu/hsa/radeon/kfd_chardev.c index 2c2601c11f48..4c4d0cad3456 100644 --- a/drivers/gpu/hsa/radeon/kfd_chardev.c +++ b/drivers/gpu/hsa/radeon/kfd_chardev.c @@ -367,6 +367,59 @@ static int kfd_ioctl_get_process_apertures(struct file *filp, struct kfd_process return 0; } /* kfd_ioctl_pmc_acquire_access - claim exclusive performance-counter access on one device. Copies struct kfd_ioctl_pmc_acquire_access_args from user space, looks the device up by args.gpu_id and, under dev->pmc_access_lock, records (p, args.trace_id) as the holder if there is no holder yet. Returns 0 when the claim is taken or when the same process and trace already hold it, -EFAULT if the copy from user space fails, -EINVAL if no device matches gpu_id, and -EBUSY if a different process or trace holds it. NOTE(review): free_process() clears the holder only for devices found on p->per_device_data, and nothing in this function adds an entry to that list - confirm a process cannot hold this claim on a device it has no per-device data for. */ +static long +kfd_ioctl_pmc_acquire_access(struct file *filp, struct kfd_process *p, void __user *arg) +{ + struct kfd_ioctl_pmc_acquire_access_args args; + struct kfd_dev *dev; + int err = -EBUSY; + + if (copy_from_user(&args, arg, sizeof(args))) + return -EFAULT; + + dev = radeon_kfd_device_by_id(args.gpu_id); + if (dev == NULL) + return -EINVAL; + + spin_lock(&dev->pmc_access_lock); + if (dev->pmc_locking_process == NULL) { + dev->pmc_locking_process = p; + dev->pmc_locking_trace = args.trace_id; + err = 0; + } else if (dev->pmc_locking_process == p && dev->pmc_locking_trace == args.trace_id) { + /* Same trace already has an access. Returning success */ + err = 0; + } + + spin_unlock(&dev->pmc_access_lock); + + return err; +} + /* kfd_ioctl_pmc_release_access - give up exclusive performance-counter access on one device. Under dev->pmc_access_lock the holder is cleared only when it matches both p and args.trace_id. Returns 0 on release, -EFAULT if the copy from user space fails, and -EINVAL if no device matches gpu_id or the caller is not the recorded holder. */ +static long +kfd_ioctl_pmc_release_access(struct file *filp, struct kfd_process *p, void __user *arg) +{ + struct kfd_ioctl_pmc_release_access_args args; + struct kfd_dev *dev; + int err = -EINVAL; + + if (copy_from_user(&args, arg, sizeof(args))) + return -EFAULT; + + dev = radeon_kfd_device_by_id(args.gpu_id); + if (dev == NULL) + return -EINVAL; + + spin_lock(&dev->pmc_access_lock); + if (dev->pmc_locking_process == p && dev->pmc_locking_trace == args.trace_id) { + dev->pmc_locking_process = NULL; + dev->pmc_locking_trace = 0; + err = 0; + } + spin_unlock(&dev->pmc_access_lock); + + return err; +} static long kfd_ioctl(struct file *filep, unsigned int cmd, unsigned long arg) @@ -403,6 +456,14 @@ kfd_ioctl(struct file *filep, unsigned int cmd, unsigned long arg) err = kfd_ioctl_get_process_apertures(filep, process, (void __user *)arg); break; + case KFD_IOC_PMC_ACQUIRE_ACCESS: + err = 
kfd_ioctl_pmc_acquire_access(filep, process, (void __user *) arg); + break; + + case KFD_IOC_PMC_RELEASE_ACCESS: + err = kfd_ioctl_pmc_release_access(filep, process, (void __user *) arg); + break; + default: dev_err(kfd_device, "unknown ioctl cmd 0x%x, arg 0x%lx)\n", diff --git a/drivers/gpu/hsa/radeon/kfd_device.c b/drivers/gpu/hsa/radeon/kfd_device.c index 6e5200794cc3..1489e791e061 100644 --- a/drivers/gpu/hsa/radeon/kfd_device.c +++ b/drivers/gpu/hsa/radeon/kfd_device.c @@ -173,6 +173,8 @@ bool kgd2kfd_device_init(struct kfd_dev *kfd, kfd->device_info->scheduler_class->start(kfd->scheduler); + /* NOTE(review): only the lock is initialised in this hunk; pmc_locking_process and pmc_locking_trace are presumably already zero from allocation - confirm. */ spin_lock_init(&kfd->pmc_access_lock); + kfd->init_complete = true; dev_info(kfd_device, "added device (%x:%x)\n", kfd->pdev->vendor, kfd->pdev->device); diff --git a/drivers/gpu/hsa/radeon/kfd_priv.h b/drivers/gpu/hsa/radeon/kfd_priv.h index 11dc66bdd14e..09051b0dd5d4 100644 --- a/drivers/gpu/hsa/radeon/kfd_priv.h +++ b/drivers/gpu/hsa/radeon/kfd_priv.h @@ -91,6 +91,11 @@ struct kfd_dev { atomic_t interrupt_ring_wptr; struct work_struct interrupt_work; spinlock_t interrupt_lock; + + /* Performance counters exclusivity: pmc_access_lock is taken around every read and write of the two holder fields below; pmc_locking_process is NULL when nobody holds exclusive access, otherwise it and pmc_locking_trace identify the holder */ + spinlock_t pmc_access_lock; + struct kfd_process *pmc_locking_process; + uint64_t pmc_locking_trace; }; /* KGD2KFD callbacks */ diff --git a/drivers/gpu/hsa/radeon/kfd_process.c b/drivers/gpu/hsa/radeon/kfd_process.c index 8684fc11ad4c..4d7bc75a4934 100644 --- a/drivers/gpu/hsa/radeon/kfd_process.c +++ b/drivers/gpu/hsa/radeon/kfd_process.c @@ -149,8 +149,15 @@ static void free_process(struct kfd_process *p) radeon_kfd_pasid_free(p->pasid); - list_for_each_entry_safe(pdd, temp, &p->per_device_data, per_device_list) + list_for_each_entry_safe(pdd, temp, &p->per_device_data, per_device_list) { + /* Clear performance-counter exclusivity on this device if process p is the recorded holder, before its per-device data is freed. */ spin_lock(&pdd->dev->pmc_access_lock); + if (pdd->dev->pmc_locking_process == p) { + pdd->dev->pmc_locking_process = NULL; + pdd->dev->pmc_locking_trace = 0; + } + spin_unlock(&pdd->dev->pmc_access_lock); kfree(pdd); + } mutex_destroy(&p->mutex); diff --git 
a/include/uapi/linux/kfd_ioctl.h b/include/uapi/linux/kfd_ioctl.h index 7c60fa425ecf..005b89a5f40f 100644 --- a/include/uapi/linux/kfd_ioctl.h +++ b/include/uapi/linux/kfd_ioctl.h @@ -95,6 +95,16 @@ struct kfd_ioctl_get_process_apertures_args{ uint8_t num_of_nodes; /* from KFD, should be in the range [1 - NUM_OF_SUPPORTED_GPUS]*/ }; /* Arguments for KFD_IOC_PMC_ACQUIRE_ACCESS: the device to claim and the trace ID that will own the claim. NOTE(review): a 32-bit field precedes a 64-bit one, so the layout depends on the enclosing pragma pack setting, whose push is not visible here - confirm it is identical for 32-bit and 64-bit user space. */ +struct kfd_ioctl_pmc_acquire_access_args { + uint32_t gpu_id; /* to KFD */ + uint64_t trace_id; /* to KFD */ +}; + /* Arguments for KFD_IOC_PMC_RELEASE_ACCESS: the release handler succeeds only when gpu_id and trace_id match the recorded holder for the calling process. */ +struct kfd_ioctl_pmc_release_access_args { + uint32_t gpu_id; /* to KFD */ + uint64_t trace_id; /* to KFD */ +}; + #define KFD_IOC_MAGIC 'K' #define KFD_IOC_GET_VERSION _IOR(KFD_IOC_MAGIC, 1, struct kfd_ioctl_get_version_args) @@ -103,6 +113,8 @@ struct kfd_ioctl_get_process_apertures_args{ #define KFD_IOC_SET_MEMORY_POLICY _IOW(KFD_IOC_MAGIC, 4, struct kfd_ioctl_set_memory_policy_args) #define KFD_IOC_GET_CLOCK_COUNTERS _IOWR(KFD_IOC_MAGIC, 5, struct kfd_ioctl_get_clock_counters_args) #define KFD_IOC_GET_PROCESS_APERTURES _IOR(KFD_IOC_MAGIC, 6, struct kfd_ioctl_get_process_apertures_args) +#define KFD_IOC_PMC_ACQUIRE_ACCESS _IOW(KFD_IOC_MAGIC, 7, struct kfd_ioctl_pmc_acquire_access_args) +#define KFD_IOC_PMC_RELEASE_ACCESS _IOW(KFD_IOC_MAGIC, 8, struct kfd_ioctl_pmc_release_access_args) #pragma pack(pop) |