diff options
author | Jérôme Glisse <jglisse@redhat.com> | 2016-11-07 17:55:19 -0500 |
---|---|---|
committer | Jérôme Glisse <jglisse@redhat.com> | 2017-01-12 11:15:38 -0500 |
commit | 6c1c5559dbd7fb3c59c326e95e031afdeb60f63b (patch) | |
tree | 54d81a763f57b516f9b92dab4aab890a89a178ef | |
parent | cf3a8908d899665bd5b9ed816fb21cdd0ce3a45b (diff) |
hmm/dmirror: dummy mirror support for fake device memoryhmm-stable
Add fake device memory.
Signed-off-by: Jérôme Glisse <jglisse@redhat.com>
-rw-r--r-- | drivers/char/hmm_dmirror.c | 320 | ||||
-rw-r--r-- | include/uapi/linux/hmm_dmirror.h | 6 |
2 files changed, 326 insertions, 0 deletions
diff --git a/drivers/char/hmm_dmirror.c b/drivers/char/hmm_dmirror.c index 8465f3adb2ee..8f6ac308a31e 100644 --- a/drivers/char/hmm_dmirror.c +++ b/drivers/char/hmm_dmirror.c @@ -75,6 +75,13 @@ struct dmirror_device { dev_t dev; struct cdev cdevice; struct platform_device *pdevice; + struct hmm_device *hmm_device; + struct page *frees; + struct hmm_devmem devmem; + spinlock_t lock; + + unsigned long calloc; + unsigned long cfree; }; static inline unsigned long dmirror_pt_pgd(unsigned long addr) @@ -406,12 +413,16 @@ static int dummy_fops_open(struct inode *inode, struct file *filp) static int dummy_fops_release(struct inode *inode, struct file *filp) { + struct dmirror_device *mdevice; struct dmirror *dmirror; if (!filp->private_data) return 0; dmirror = filp->private_data; + mdevice = dmirror->mdevice; + printk(KERN_INFO "DEVICE PAGE %ld %ld (%ld)\n", mdevice->calloc, mdevice->cfree, mdevice->calloc - mdevice->cfree); + dmirror_del(dmirror); filp->private_data = NULL; @@ -538,6 +549,14 @@ static int dummy_fault(struct dmirror *dmirror, return 0; } +static bool dummy_device_is_mine(struct dmirror_device *mdevice, + struct page *page) +{ + if (!is_zone_device_page(page)) + return false; + return page->pgmap->data == &mdevice->devmem; +} + static int dummy_do_read(struct dmirror *dmirror, unsigned long addr, unsigned long end, @@ -558,6 +577,11 @@ static int dummy_do_read(struct dmirror *dmirror, if (!page) { return -ENOENT; } + if (is_zone_device_page(page)) { + if (!dummy_device_is_mine(mdevice, page)) + return -ENOENT; + page = (void *)hmm_devmem_page_get_drvdata(page); + } tmp = kmap(page); memcpy(ptr, tmp, PAGE_SIZE); @@ -633,6 +657,11 @@ static int dummy_do_write(struct dmirror *dmirror, page = dmirror_pt_page(*dpte); if (!page || !(*dpte & DPT_WRITE)) return -ENOENT; + if (is_zone_device_page(page)) { + if (!dummy_device_is_mine(mdevice, page)) + return -ENOENT; + page = (void *)hmm_devmem_page_get_drvdata(page); + } tmp = kmap(page); memcpy(tmp, ptr, PAGE_SIZE); @@ -691,11 +720,164 @@ again: return 0; } +static struct page *dummy_device_alloc_page(struct dmirror_device *mdevice) +{ + struct page *dpage = NULL, *rpage; + + /* + * This is a fake device so we alloc real system memory to fake + * our device memory + */ + rpage = alloc_page(GFP_HIGHUSER); + if (!rpage) + return NULL; + + spin_lock(&mdevice->lock); + if (mdevice->frees) { + dpage = mdevice->frees; + mdevice->frees = dpage->s_mem; + } else { + spin_unlock(&mdevice->lock); + __free_page(rpage); + return NULL; + } + + if (!trylock_page(dpage)) { + dpage->s_mem = mdevice->frees; + mdevice->frees = dpage; + spin_unlock(&mdevice->lock); + __free_page(rpage); + return NULL; + } + spin_unlock(&mdevice->lock); + + mdevice->calloc++; + hmm_devmem_page_set_drvdata(dpage, (unsigned long)rpage); + get_page(dpage); + return dpage; +} + +struct dummy_migrate { + struct dmirror_device *mdevice; + struct hmm_dmirror_migrate *dmigrate; +}; + +static void dummy_migrate_alloc_and_copy(struct vm_area_struct *vma, + const hmm_pfn_t *src_pfns, + hmm_pfn_t *dst_pfns, + unsigned long start, + unsigned long end, + void *private) +{ + struct dummy_migrate *dmigrate = private; + struct dmirror_device *mdevice; + unsigned long addr; + + if (!dmigrate) + return; + + mdevice = dmigrate->mdevice; + + for (addr=start; addr<end; addr+=PAGE_SIZE, src_pfns++, dst_pfns++) { + struct page *spage = hmm_pfn_to_page(*src_pfns); + struct page *dpage, *rpage; + + if (!spage || !(*src_pfns & HMM_PFN_MIGRATE)) + continue; + if (*src_pfns & HMM_PFN_DEVICE) { + if (!dummy_device_is_mine(mdevice, spage)) { + continue; + } + spage = (void *)hmm_devmem_page_get_drvdata(spage); + } + + dpage = dummy_device_alloc_page(mdevice); + if (!dpage) + continue; + + rpage = (void *)hmm_devmem_page_get_drvdata(dpage); + + copy_highpage(rpage, spage); + *dst_pfns = hmm_pfn_from_page(dpage) | + HMM_PFN_MIGRATE | HMM_PFN_LOCKED; + } +} + +static void dummy_migrate_finalize_and_map(struct vm_area_struct *vma, + const hmm_pfn_t *src_pfns, + hmm_pfn_t *dst_pfns, + unsigned long start, + unsigned long end, + void *private) +{ + struct dummy_migrate *dmigrate = private; + unsigned long addr; + + if (!dmigrate || !dmigrate->dmigrate) + return; + + for (addr=start; addr<end; addr+=PAGE_SIZE, src_pfns++, dst_pfns++) { + struct page *page = hmm_pfn_to_page(*dst_pfns); + + if (!(*src_pfns & HMM_PFN_MIGRATE)) + continue; + if (!dummy_device_is_mine(dmigrate->mdevice, page)) + continue; + dmigrate->dmigrate->npages++; + } +} + +static const struct hmm_migrate_ops dmirror_migrate_ops = { + .alloc_and_copy = dummy_migrate_alloc_and_copy, + .finalize_and_map = dummy_migrate_finalize_and_map, +}; + +static int dummy_migrate(struct dmirror *dmirror, + struct hmm_dmirror_migrate *dmigrate) +{ + unsigned long addr = dmigrate->addr, end; + struct mm_struct *mm = dmirror->mm; + struct vm_area_struct *vma; + struct dummy_migrate tmp; + int ret; + + tmp.mdevice = dmirror->mdevice; + tmp.dmigrate = dmigrate; + + down_read(&mm->mmap_sem); + end = addr + (dmigrate->npages << PAGE_SHIFT); + vma = find_vma_intersection(mm, addr, end); + if (!vma || vma->vm_start > addr || vma->vm_end < end) { + ret = -EINVAL; + goto out; + } + + for (dmigrate->npages = 0; addr < end;) { + hmm_pfn_t src_pfns[64]; + hmm_pfn_t dst_pfns[64]; + unsigned long next; + + next = min(end, addr + (64 << PAGE_SHIFT)); + + ret = hmm_vma_migrate(&dmirror_migrate_ops, vma, src_pfns, + dst_pfns, addr, next, &tmp); + if (ret) + goto out; + + addr = next; + } + +out: + up_read(&mm->mmap_sem); + return ret; +} + static long dummy_fops_unlocked_ioctl(struct file *filp, unsigned int command, unsigned long arg) { void __user *uarg = (void __user *)arg; + struct hmm_dmirror_migrate dmigrate; struct hmm_dmirror_write dwrite; struct hmm_dmirror_read dread; struct dmirror *dmirror; @@ -726,6 +908,16 @@ static long dummy_fops_unlocked_ioctl(struct file *filp, return ret; return copy_to_user(uarg, &dwrite, sizeof(dwrite)); + case HMM_DMIRROR_MIGRATE: + ret = copy_from_user(&dmigrate, uarg, sizeof(dmigrate)); + if (ret) + return ret; + + ret = dummy_migrate(dmirror, &dmigrate); + if (ret) + return ret; + + return copy_to_user(uarg, &dmigrate, sizeof(dmigrate)); default: ret = -EINVAL; break; @@ -745,13 +937,123 @@ static const struct file_operations dmirror_fops = { .owner = THIS_MODULE, }; +static void dummy_devmem_free(struct hmm_devmem *devmem, + struct page *page) +{ + struct dmirror_device *mdevice; + struct page *rpage; + + mdevice = container_of(devmem, struct dmirror_device, devmem); + rpage = (struct page *)hmm_devmem_page_get_drvdata(page); + __free_page(rpage); + mdevice->cfree++; + + spin_lock(&mdevice->lock); + page->s_mem = mdevice->frees; + mdevice->frees = page; + spin_unlock(&mdevice->lock); +} + +struct dummy_devmem_fault { + struct dmirror_device *mdevice; +}; + +static void dummy_devmem_fault_alloc_and_copy(struct vm_area_struct *vma, + const hmm_pfn_t *src_pfns, + hmm_pfn_t *dst_pfns, + unsigned long start, + unsigned long end, + void *private) +{ + struct dummy_devmem_fault *fault = private; + unsigned long addr; + + for (addr=start; addr<end; addr+=PAGE_SIZE, src_pfns++, dst_pfns++) { + struct page *dpage, *spage; + + spage = hmm_pfn_to_page(*src_pfns); + if (!spage || !(*src_pfns & HMM_PFN_MIGRATE)) + continue; + if (!dummy_device_is_mine(fault->mdevice, spage)) { + *dst_pfns = HMM_PFN_ERROR; + continue; + } + spage = (void *)hmm_devmem_page_get_drvdata(spage); + + dpage = hmm_vma_alloc_locked_page(vma, addr); + if (!dpage) { + *dst_pfns = HMM_PFN_ERROR; + continue; + } + + copy_highpage(dpage, spage); + *dst_pfns = hmm_pfn_from_page(dpage) | + HMM_PFN_MIGRATE | + HMM_PFN_LOCKED; + } +} + +void dummy_devmem_fault_finalize_and_map(struct vm_area_struct *vma, + const hmm_pfn_t *src_pfns, + hmm_pfn_t *dst_pfns, + unsigned long start, + unsigned long end, + void *private) +{ +} + +static const struct hmm_migrate_ops dummy_devmem_migrate = { + .alloc_and_copy = dummy_devmem_fault_alloc_and_copy, + .finalize_and_map = dummy_devmem_fault_finalize_and_map, +}; + +static int dummy_devmem_fault(struct hmm_devmem *devmem, + struct vm_area_struct *vma, + unsigned long addr, + struct page *page, + unsigned flags, + pmd_t *pmdp) +{ + hmm_pfn_t src_pfns = HMM_PFN_MIGRATE, dst_pfns = 0; + struct dummy_devmem_fault fault; + unsigned long start, end; + + fault.mdevice = container_of(devmem, struct dmirror_device, devmem); + + /* FIXME demonstrate how we can adjust migrate range */ + start = addr; + end = addr + PAGE_SIZE; + return hmm_devmem_fault_range(devmem, vma, &dummy_devmem_migrate, + &src_pfns, &dst_pfns, start, + addr, end, &fault); +} + +static const struct hmm_devmem_ops dmirror_devmem_ops = { + .free = dummy_devmem_free, + .fault = dummy_devmem_fault, +}; + static int dmirror_probe(struct platform_device *pdev) { struct dmirror_device *mdevice = platform_get_drvdata(pdev); + struct hmm_devmem *devmem = &mdevice->devmem; + unsigned long pfn; int ret; + mdevice->hmm_device = hmm_device_new(); + if (IS_ERR(mdevice->hmm_device)) + return PTR_ERR(mdevice->hmm_device); + ret = hmm_devmem_add(&mdevice->devmem, &dmirror_devmem_ops, + &mdevice->hmm_device->device, 64 << 20); + if (ret) { + hmm_device_put(mdevice->hmm_device); + return ret; + } + ret = alloc_chrdev_region(&mdevice->dev, 0, 1, "HMM_DMIRROR"); if (ret < 0) { + hmm_devmem_remove(&mdevice->devmem); + hmm_device_put(mdevice->hmm_device); return ret; } @@ -759,9 +1061,24 @@ static int dmirror_probe(struct platform_device *pdev) ret = cdev_add(&mdevice->cdevice, mdevice->dev, 1); if (ret) { unregister_chrdev_region(mdevice->dev, 1); + hmm_devmem_remove(&mdevice->devmem); + hmm_device_put(mdevice->hmm_device); return ret; } + /* Build list of free struct page */ + spin_lock_init(&mdevice->lock); + mdevice->frees = NULL; + for (pfn = devmem->pfn_first; pfn < devmem->pfn_last; pfn++) { + struct page *page = pfn_to_page(pfn); + + page->s_mem = mdevice->frees; + mdevice->frees = page; + } + + mdevice->calloc = 0; + mdevice->cfree = 0; + return 0; } @@ -769,6 +1086,9 @@ static int dmirror_remove(struct platform_device *pdev) { struct dmirror_device *mdevice = platform_get_drvdata(pdev); + if (!hmm_devmem_remove(&mdevice->devmem)) + printk(KERN_INFO "HMM device memory still in use !\n"); + hmm_device_put(mdevice->hmm_device); cdev_del(&mdevice->cdevice); unregister_chrdev_region(mdevice->dev, 1); return 0; diff --git a/include/uapi/linux/hmm_dmirror.h b/include/uapi/linux/hmm_dmirror.h index b6b147a04d2c..add818fb28d8 100644 --- a/include/uapi/linux/hmm_dmirror.h +++ b/include/uapi/linux/hmm_dmirror.h @@ -41,8 +41,14 @@ struct hmm_dmirror_write { uint64_t dpages; }; +struct hmm_dmirror_migrate { + uint64_t addr; + uint64_t npages; +}; + /* Expose the address space of the calling process through hmm dummy dev file */ #define HMM_DMIRROR_READ _IOWR('H', 0x00, struct hmm_dmirror_read) #define HMM_DMIRROR_WRITE _IOWR('H', 0x01, struct hmm_dmirror_write) +#define HMM_DMIRROR_MIGRATE _IOWR('H', 0x02, struct hmm_dmirror_migrate) #endif /* _UAPI_LINUX_HMM_DMIRROR_H */ |