/*	$NetBSD: vmwgfx_page_dirty.c,v 1.2 2021/12/18 23:45:45 riastradh Exp $	*/

// SPDX-License-Identifier: GPL-2.0 OR MIT
/**************************************************************************
 *
 * Copyright 2019 VMware, Inc., Palo Alto, CA., USA
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/
#include <sys/cdefs.h>
__KERNEL_RCSID(0, "$NetBSD: vmwgfx_page_dirty.c,v 1.2 2021/12/18 23:45:45 riastradh Exp $");

#include "vmwgfx_drv.h"

/*
 * Different methods for tracking dirty:
 * VMW_BO_DIRTY_PAGETABLE - Scan the pagetable for hardware dirty bits
 * VMW_BO_DIRTY_MKWRITE - Write-protect page table entries and record write-
 * accesses in the VM mkwrite() callback
 */
enum vmw_bo_dirty_method {
	VMW_BO_DIRTY_PAGETABLE,
	VMW_BO_DIRTY_MKWRITE,
};

/*
 * A scan that finds no dirtied pages triggers a transition to the
 * _MKWRITE method; similarly, a scan that finds more than a certain
 * percentage of dirty pages triggers a transition to the _PAGETABLE
 * method. How many consecutive triggers should we wait for before
 * changing method?
 */
#define VMW_DIRTY_NUM_CHANGE_TRIGGERS 2

/* Percentage of dirty pages that triggers a transition to the _PAGETABLE method */
#define VMW_DIRTY_PERCENTAGE 10

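/*
 * Illustrative example only (the numbers are hypothetical): with a
 * 512-page buffer object, an mkwrite scan that write-protects
 * num_marked = 64 pages yields 100UL * 64 / 512 == 12 > VMW_DIRTY_PERCENTAGE,
 * which counts as one trigger. After more than
 * VMW_DIRTY_NUM_CHANGE_TRIGGERS consecutive such scans, the tracking
 * method switches to VMW_BO_DIRTY_PAGETABLE.
 */
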
/**
 * struct vmw_bo_dirty - Dirty information for buffer objects
 * @start: First currently dirty bit
 * @end: Last currently dirty bit + 1
 * @method: The currently used dirty method
 * @change_count: Number of consecutive method change triggers
 * @ref_count: Reference count for this structure
 * @bitmap_size: The size of the bitmap in bits. Typically equal to the
 * number of pages in the bo.
 * @size: The accounting size for this struct.
 * @bitmap: A bitmap where each bit represents a page. A set bit means a
 * dirty page.
 */
struct vmw_bo_dirty {
	unsigned long start;
	unsigned long end;
	enum vmw_bo_dirty_method method;
	unsigned int change_count;
	unsigned int ref_count;
	unsigned long bitmap_size;
	size_t size;
	unsigned long bitmap[0];
};
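
/*
 * Illustrative sizing example (hypothetical numbers): for a bo of
 * num_pages = 200 pages on a 64-bit machine, the trailing bitmap needs
 * BITS_TO_LONGS(200) == 4 longs, so vmw_bo_dirty_add() below allocates
 * sizeof(struct vmw_bo_dirty) + 4 * sizeof(long) bytes for the struct
 * and its bitmap together.
 */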

/**
 * vmw_bo_dirty_scan_pagetable - Perform a pagetable scan for dirty bits
 * @vbo: The buffer object to scan
 *
 * Scans the pagetable for dirty bits. Clears those bits and modifies the
 * dirty structure with the results. This function may change the
 * dirty-tracking method.
 */
static void vmw_bo_dirty_scan_pagetable(struct vmw_buffer_object *vbo)
{
	struct vmw_bo_dirty *dirty = vbo->dirty;
	pgoff_t offset = drm_vma_node_start(&vbo->base.base.vma_node);
	struct address_space *mapping = vbo->base.bdev->dev_mapping;
	pgoff_t num_marked;

	num_marked = clean_record_shared_mapping_range
		(mapping,
		 offset, dirty->bitmap_size,
		 offset, &dirty->bitmap[0],
		 &dirty->start, &dirty->end);
	if (num_marked == 0)
		dirty->change_count++;
	else
		dirty->change_count = 0;

	if (dirty->change_count > VMW_DIRTY_NUM_CHANGE_TRIGGERS) {
		dirty->change_count = 0;
		dirty->method = VMW_BO_DIRTY_MKWRITE;
		wp_shared_mapping_range(mapping,
					offset, dirty->bitmap_size);
		clean_record_shared_mapping_range(mapping,
						  offset, dirty->bitmap_size,
						  offset, &dirty->bitmap[0],
						  &dirty->start, &dirty->end);
	}
}

/**
 * vmw_bo_dirty_scan_mkwrite - Reset the mkwrite dirty-tracking method
 * @vbo: The buffer object to scan
 *
 * Write-protects the pages that have been written to, so that subsequent
 * write accesses will trigger a call to mkwrite.
 *
 * This function may change the dirty-tracking method.
 */
static void vmw_bo_dirty_scan_mkwrite(struct vmw_buffer_object *vbo)
{
	struct vmw_bo_dirty *dirty = vbo->dirty;
	unsigned long offset = drm_vma_node_start(&vbo->base.base.vma_node);
	struct address_space *mapping = vbo->base.bdev->dev_mapping;
	pgoff_t num_marked;

	if (dirty->end <= dirty->start)
		return;

	num_marked = wp_shared_mapping_range(mapping,
					dirty->start + offset,
					dirty->end - dirty->start);

	if (100UL * num_marked / dirty->bitmap_size >
	    VMW_DIRTY_PERCENTAGE) {
		dirty->change_count++;
	} else {
		dirty->change_count = 0;
	}

	if (dirty->change_count > VMW_DIRTY_NUM_CHANGE_TRIGGERS) {
		pgoff_t start = 0;
		pgoff_t end = dirty->bitmap_size;

		dirty->method = VMW_BO_DIRTY_PAGETABLE;
		clean_record_shared_mapping_range(mapping, offset, end, offset,
						  &dirty->bitmap[0],
						  &start, &end);
		bitmap_clear(&dirty->bitmap[0], 0, dirty->bitmap_size);
		if (dirty->start < dirty->end)
			bitmap_set(&dirty->bitmap[0], dirty->start,
				   dirty->end - dirty->start);
		dirty->change_count = 0;
	}
}

/**
 * vmw_bo_dirty_scan - Scan for dirty pages and add them to the dirty
 * tracking structure
 * @vbo: The buffer object to scan
 *
 * This function may change the dirty tracking method.
 */
void vmw_bo_dirty_scan(struct vmw_buffer_object *vbo)
{
	struct vmw_bo_dirty *dirty = vbo->dirty;

	if (dirty->method == VMW_BO_DIRTY_PAGETABLE)
		vmw_bo_dirty_scan_pagetable(vbo);
	else
		vmw_bo_dirty_scan_mkwrite(vbo);
}
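
/*
 * Example (hypothetical caller, for illustration only): before reading
 * back dirty ranges for a resource, a validation path would typically
 * run a scan so that the bitmap is up to date:
 *
 *	if (vbo->dirty)
 *		vmw_bo_dirty_scan(vbo);
 *	vmw_bo_dirty_transfer_to_res(res);
 *
 * The actual call sites live elsewhere in the driver.
 */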

/**
 * vmw_bo_dirty_pre_unmap - write-protect and pick up dirty pages before
 * an unmap_mapping_range operation.
 * @vbo: The buffer object.
 * @start: First page of the range within the buffer object.
 * @end: Last page of the range within the buffer object + 1.
 *
 * If we're using the _PAGETABLE scan method, we may leak dirty pages
 * when calling unmap_mapping_range(). This function makes sure we pick
 * up all dirty pages.
 */
static void vmw_bo_dirty_pre_unmap(struct vmw_buffer_object *vbo,
				   pgoff_t start, pgoff_t end)
{
	struct vmw_bo_dirty *dirty = vbo->dirty;
	unsigned long offset = drm_vma_node_start(&vbo->base.base.vma_node);
	struct address_space *mapping = vbo->base.bdev->dev_mapping;

	if (dirty->method != VMW_BO_DIRTY_PAGETABLE || start >= end)
		return;

	wp_shared_mapping_range(mapping, start + offset, end - start);
	clean_record_shared_mapping_range(mapping, start + offset,
					  end - start, offset,
					  &dirty->bitmap[0], &dirty->start,
					  &dirty->end);
}

/**
 * vmw_bo_dirty_unmap - Clear all ptes pointing to a range within a bo
 * @vbo: The buffer object.
 * @start: First page of the range within the buffer object.
 * @end: Last page of the range within the buffer object + 1.
 *
 * This is similar to ttm_bo_unmap_virtual_locked() except it takes a subrange.
 */
void vmw_bo_dirty_unmap(struct vmw_buffer_object *vbo,
			pgoff_t start, pgoff_t end)
{
	unsigned long offset = drm_vma_node_start(&vbo->base.base.vma_node);
	struct address_space *mapping = vbo->base.bdev->dev_mapping;

	vmw_bo_dirty_pre_unmap(vbo, start, end);
	unmap_shared_mapping_range(mapping, (offset + start) << PAGE_SHIFT,
				   (loff_t) (end - start) << PAGE_SHIFT);
}
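
/*
 * Worked example (illustrative numbers only): with PAGE_SHIFT == 12,
 * offset == 0x100 and a range of pages [3, 8) within the bo,
 * unmap_shared_mapping_range() above is called with a byte start of
 * (0x100 + 3) << 12 == 0x103000 and a byte length of 5 << 12 == 0x5000.
 */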

/**
 * vmw_bo_dirty_add - Add a dirty-tracking user to a buffer object
 * @vbo: The buffer object
 *
 * This function registers a dirty-tracking user with a buffer object.
 * A user can be for example a resource or a vma in a special user-space
 * mapping.
 *
 * Return: Zero on success, -ENOMEM on memory allocation failure.
 */
int vmw_bo_dirty_add(struct vmw_buffer_object *vbo)
{
	struct vmw_bo_dirty *dirty = vbo->dirty;
	pgoff_t num_pages = vbo->base.num_pages;
	size_t size, acc_size;
	int ret;
	static struct ttm_operation_ctx ctx = {
		.interruptible = false,
		.no_wait_gpu = false
	};

	if (dirty) {
		dirty->ref_count++;
		return 0;
	}

	size = sizeof(*dirty) + BITS_TO_LONGS(num_pages) * sizeof(long);
	acc_size = ttm_round_pot(size);
	ret = ttm_mem_global_alloc(&ttm_mem_glob, acc_size, &ctx);
	if (ret) {
		VMW_DEBUG_USER("Out of graphics memory for buffer object "
			       "dirty tracker.\n");
		return ret;
	}
	dirty = kvzalloc(size, GFP_KERNEL);
	if (!dirty) {
		ret = -ENOMEM;
		goto out_no_dirty;
	}

	dirty->size = acc_size;
	dirty->bitmap_size = num_pages;
	dirty->start = dirty->bitmap_size;
	dirty->end = 0;
	dirty->ref_count = 1;
	if (num_pages < PAGE_SIZE / sizeof(pte_t)) {
		dirty->method = VMW_BO_DIRTY_PAGETABLE;
	} else {
		struct address_space *mapping = vbo->base.bdev->dev_mapping;
		pgoff_t offset = drm_vma_node_start(&vbo->base.base.vma_node);

		dirty->method = VMW_BO_DIRTY_MKWRITE;

		/* Write-protect and then pick up already dirty bits */
		wp_shared_mapping_range(mapping, offset, num_pages);
		clean_record_shared_mapping_range(mapping, offset, num_pages,
						  offset,
						  &dirty->bitmap[0],
						  &dirty->start, &dirty->end);
	}

	vbo->dirty = dirty;

	return 0;

out_no_dirty:
	ttm_mem_global_free(&ttm_mem_glob, acc_size);
	return ret;
}

/**
 * vmw_bo_dirty_release - Release a dirty-tracking user from a buffer object
 * @vbo: The buffer object
 *
 * This function releases a dirty-tracking user from a buffer object.
 * If the reference count reaches zero, then the dirty-tracking object is
 * freed and the pointer to it cleared.
 */
void vmw_bo_dirty_release(struct vmw_buffer_object *vbo)
{
	struct vmw_bo_dirty *dirty = vbo->dirty;

	if (dirty && --dirty->ref_count == 0) {
		size_t acc_size = dirty->size;

		kvfree(dirty);
		ttm_mem_global_free(&ttm_mem_glob, acc_size);
		vbo->dirty = NULL;
	}
}
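
/*
 * Illustrative usage sketch (hypothetical caller, not part of this file):
 * every dirty-tracking user pairs vmw_bo_dirty_add() with a matching
 * vmw_bo_dirty_release():
 *
 *	ret = vmw_bo_dirty_add(vbo);
 *	if (ret)
 *		return ret;
 *	...
 *	vmw_bo_dirty_release(vbo);
 *
 * The reference count in struct vmw_bo_dirty keeps the tracker alive
 * while any such user remains.
 */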

/**
 * vmw_bo_dirty_transfer_to_res - Pick up a resource's dirty region from
 * its backing mob.
 * @res: The resource
 *
 * This function will pick up all dirty ranges affecting the resource from
 * its backup mob, and call vmw_resource_dirty_update() once for each
 * range. The transferred ranges will be cleared from the backing mob's
 * dirty tracking.
 */
void vmw_bo_dirty_transfer_to_res(struct vmw_resource *res)
{
	struct vmw_buffer_object *vbo = res->backup;
	struct vmw_bo_dirty *dirty = vbo->dirty;
	pgoff_t start, cur, end;
	unsigned long res_start = res->backup_offset;
	unsigned long res_end = res->backup_offset + res->backup_size;

	WARN_ON_ONCE(res_start & ~PAGE_MASK);
	res_start >>= PAGE_SHIFT;
	res_end = DIV_ROUND_UP(res_end, PAGE_SIZE);

	if (res_start >= dirty->end || res_end <= dirty->start)
		return;

	/* Walk only the intersection of the resource and the dirty range */
	cur = max(res_start, dirty->start);
	res_end = min(res_end, dirty->end);
	while (cur < res_end) {
		unsigned long num;

		start = find_next_bit(&dirty->bitmap[0], res_end, cur);
		if (start >= res_end)
			break;

		end = find_next_zero_bit(&dirty->bitmap[0], res_end, start + 1);
		cur = end + 1;
		num = end - start;
		bitmap_clear(&dirty->bitmap[0], start, num);
		vmw_resource_dirty_update(res, start, end);
	}

	if (res_start <= dirty->start && res_end > dirty->start)
		dirty->start = res_end;
	if (res_start < dirty->end && res_end >= dirty->end)
		dirty->end = res_start;
}
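
/*
 * Illustrative walk-through (hypothetical numbers): suppose the resource
 * covers pages [2, 10) and the bitmap has bits 3..5 and 7 set. The loop
 * above calls vmw_resource_dirty_update(res, 3, 6) and then
 * vmw_resource_dirty_update(res, 7, 8), clearing those bits as it goes.
 */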

/**
 * vmw_bo_dirty_clear_res - Clear a resource's dirty region from
 * its backing mob.
 * @res: The resource
 *
 * This function will clear all dirty ranges affecting the resource from
 * its backup mob's dirty tracking.
 */
void vmw_bo_dirty_clear_res(struct vmw_resource *res)
{
	unsigned long res_start = res->backup_offset;
	unsigned long res_end = res->backup_offset + res->backup_size;
	struct vmw_buffer_object *vbo = res->backup;
	struct vmw_bo_dirty *dirty = vbo->dirty;

	res_start >>= PAGE_SHIFT;
	res_end = DIV_ROUND_UP(res_end, PAGE_SIZE);

	if (res_start >= dirty->end || res_end <= dirty->start)
		return;

	res_start = max(res_start, dirty->start);
	res_end = min(res_end, dirty->end);
	bitmap_clear(&dirty->bitmap[0], res_start, res_end - res_start);

	if (res_start <= dirty->start && res_end > dirty->start)
		dirty->start = res_end;
	if (res_start < dirty->end && res_end >= dirty->end)
		dirty->end = res_start;
}

vm_fault_t vmw_bo_vm_mkwrite(struct vm_fault *vmf)
{
	struct vm_area_struct *vma = vmf->vma;
	struct ttm_buffer_object *bo = (struct ttm_buffer_object *)
	    vma->vm_private_data;
	vm_fault_t ret;
	unsigned long page_offset;
	unsigned int save_flags;
	struct vmw_buffer_object *vbo =
		container_of(bo, typeof(*vbo), base);

	/*
	 * mkwrite() doesn't handle the VM_FAULT_RETRY return value correctly.
	 * So make sure the TTM helpers are aware.
	 */
	save_flags = vmf->flags;
	vmf->flags &= ~FAULT_FLAG_ALLOW_RETRY;
	ret = ttm_bo_vm_reserve(bo, vmf);
	vmf->flags = save_flags;
	if (ret)
		return ret;

	page_offset = vmf->pgoff - drm_vma_node_start(&bo->base.vma_node);
	if (unlikely(page_offset >= bo->num_pages)) {
		ret = VM_FAULT_SIGBUS;
		goto out_unlock;
	}

	if (vbo->dirty && vbo->dirty->method == VMW_BO_DIRTY_MKWRITE &&
	    !test_bit(page_offset, &vbo->dirty->bitmap[0])) {
		struct vmw_bo_dirty *dirty = vbo->dirty;

		__set_bit(page_offset, &dirty->bitmap[0]);
		dirty->start = min(dirty->start, page_offset);
		dirty->end = max(dirty->end, page_offset + 1);
	}

out_unlock:
	dma_resv_unlock(bo->base.resv);
	return ret;
}

vm_fault_t vmw_bo_vm_fault(struct vm_fault *vmf)
{
	struct vm_area_struct *vma = vmf->vma;
	struct ttm_buffer_object *bo = (struct ttm_buffer_object *)
	    vma->vm_private_data;
	struct vmw_buffer_object *vbo =
		container_of(bo, struct vmw_buffer_object, base);
	pgoff_t num_prefault;
	pgprot_t prot;
	vm_fault_t ret;

	ret = ttm_bo_vm_reserve(bo, vmf);
	if (ret)
		return ret;

	num_prefault = (vma->vm_flags & VM_RAND_READ) ? 1 :
		TTM_BO_VM_NUM_PREFAULT;

	if (vbo->dirty) {
		pgoff_t allowed_prefault;
		unsigned long page_offset;

		page_offset = vmf->pgoff -
			drm_vma_node_start(&bo->base.vma_node);
		if (page_offset >= bo->num_pages ||
		    vmw_resources_clean(vbo, page_offset,
					page_offset + PAGE_SIZE,
					&allowed_prefault)) {
			ret = VM_FAULT_SIGBUS;
			goto out_unlock;
		}

		num_prefault = min(num_prefault, allowed_prefault);
	}

	/*
	 * If we don't track dirty using the MKWRITE method, make sure
	 * the page protection is write-enabled so we don't get
	 * a lot of unnecessary write faults.
	 */
	if (vbo->dirty && vbo->dirty->method == VMW_BO_DIRTY_MKWRITE)
		prot = vma->vm_page_prot;
	else
		prot = vm_get_page_prot(vma->vm_flags);

	ret = ttm_bo_vm_fault_reserved(vmf, prot, num_prefault);
	if (ret == VM_FAULT_RETRY && !(vmf->flags & FAULT_FLAG_RETRY_NOWAIT))
		return ret;

out_unlock:
	dma_resv_unlock(bo->base.resv);

	return ret;
}
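
/*
 * Note (informational, based on the rest of the driver): these two
 * handlers are wired into a user-space mapping's vma through a
 * vm_operations_struct, roughly like the sketch below. The actual
 * structure lives elsewhere in vmwgfx, not in this file:
 *
 *	static const struct vm_operations_struct vmw_vm_ops = {
 *		.pfn_mkwrite = vmw_bo_vm_mkwrite,
 *		.page_mkwrite = vmw_bo_vm_mkwrite,
 *		.fault = vmw_bo_vm_fault,
 *		.open = ttm_bo_vm_open,
 *		.close = ttm_bo_vm_close,
 *	};
 */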