1 /* 2 * Copyright (C) 2012-2014 Canonical Ltd (Maarten Lankhorst) 3 * 4 * Based on bo.c which bears the following copyright notice, 5 * but is dual licensed: 6 * 7 * Copyright (c) 2006-2009 VMware, Inc., Palo Alto, CA., USA 8 * All Rights Reserved. 9 * 10 * Permission is hereby granted, free of charge, to any person obtaining a 11 * copy of this software and associated documentation files (the 12 * "Software"), to deal in the Software without restriction, including 13 * without limitation the rights to use, copy, modify, merge, publish, 14 * distribute, sub license, and/or sell copies of the Software, and to 15 * permit persons to whom the Software is furnished to do so, subject to 16 * the following conditions: 17 * 18 * The above copyright notice and this permission notice (including the 19 * next paragraph) shall be included in all copies or substantial portions 20 * of the Software. 21 * 22 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 23 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 24 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL 25 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, 26 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 27 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 28 * USE OR OTHER DEALINGS IN THE SOFTWARE. 29 * 30 **************************************************************************/ 31 /* 32 * Authors: Thomas Hellstrom <thellstrom-at-vmware-dot-com> 33 */ 34 35 #include <linux/dma-resv.h> 36 #include <linux/export.h> 37 #include <linux/sched/mm.h> 38 39 /** 40 * DOC: Reservation Object Overview 41 * 42 * The reservation object provides a mechanism to manage shared and 43 * exclusive fences associated with a buffer. A reservation object 44 * can have attached one exclusive fence (normally associated with 45 * write operations) or N shared fences (read operations). The RCU 46 * mechanism is used to protect read access to fences from locked 47 * write-side updates. 48 */ 49 50 DEFINE_WD_CLASS(reservation_ww_class); 51 EXPORT_SYMBOL(reservation_ww_class); 52 53 struct lock_class_key reservation_seqcount_class; 54 EXPORT_SYMBOL(reservation_seqcount_class); 55 56 const char reservation_seqcount_string[] = "reservation_seqcount"; 57 EXPORT_SYMBOL(reservation_seqcount_string); 58 59 /** 60 * dma_resv_list_alloc - allocate fence list 61 * @shared_max: number of fences we need space for 62 * 63 * Allocate a new dma_resv_list and make sure to correctly initialize 64 * shared_max. 65 */ 66 static struct dma_resv_list *dma_resv_list_alloc(unsigned int shared_max) 67 { 68 struct dma_resv_list *list; 69 70 list = kmalloc(offsetof(typeof(*list), shared[shared_max]), GFP_KERNEL); 71 if (!list) 72 return NULL; 73 74 #ifdef __linux__ 75 list->shared_max = (ksize(list) - offsetof(typeof(*list), shared)) / 76 sizeof(*list->shared); 77 #else 78 list->shared_max = (offsetof(typeof(*list), shared[shared_max]) - 79 offsetof(typeof(*list), shared)) / sizeof(*list->shared); 80 #endif 81 82 return list; 83 } 84 85 /** 86 * dma_resv_list_free - free fence list 87 * @list: list to free 88 * 89 * Free a dma_resv_list and make sure to drop all references. 90 */ 91 static void dma_resv_list_free(struct dma_resv_list *list) 92 { 93 unsigned int i; 94 95 if (!list) 96 return; 97 98 for (i = 0; i < list->shared_count; ++i) 99 dma_fence_put(rcu_dereference_protected(list->shared[i], true)); 100 101 kfree_rcu(list, rcu); 102 } 103 104 #if IS_ENABLED(CONFIG_LOCKDEP) 105 static int __init dma_resv_lockdep(void) 106 { 107 struct mm_struct *mm = mm_alloc(); 108 struct ww_acquire_ctx ctx; 109 struct dma_resv obj; 110 int ret; 111 112 if (!mm) 113 return -ENOMEM; 114 115 dma_resv_init(&obj); 116 117 down_read(&mm->mmap_sem); 118 ww_acquire_init(&ctx, &reservation_ww_class); 119 ret = dma_resv_lock(&obj, &ctx); 120 if (ret == -EDEADLK) 121 dma_resv_lock_slow(&obj, &ctx); 122 fs_reclaim_acquire(GFP_KERNEL); 123 fs_reclaim_release(GFP_KERNEL); 124 ww_mutex_unlock(&obj.lock); 125 ww_acquire_fini(&ctx); 126 up_read(&mm->mmap_sem); 127 128 mmput(mm); 129 130 return 0; 131 } 132 subsys_initcall(dma_resv_lockdep); 133 #endif 134 135 /** 136 * dma_resv_init - initialize a reservation object 137 * @obj: the reservation object 138 */ 139 void dma_resv_init(struct dma_resv *obj) 140 { 141 ww_mutex_init(&obj->lock, &reservation_ww_class); 142 143 __seqcount_init(&obj->seq, reservation_seqcount_string, 144 &reservation_seqcount_class); 145 RCU_INIT_POINTER(obj->fence, NULL); 146 RCU_INIT_POINTER(obj->fence_excl, NULL); 147 } 148 EXPORT_SYMBOL(dma_resv_init); 149 150 /** 151 * dma_resv_fini - destroys a reservation object 152 * @obj: the reservation object 153 */ 154 void dma_resv_fini(struct dma_resv *obj) 155 { 156 struct dma_resv_list *fobj; 157 struct dma_fence *excl; 158 159 /* 160 * This object should be dead and all references must have 161 * been released to it, so no need to be protected with rcu. 162 */ 163 excl = rcu_dereference_protected(obj->fence_excl, 1); 164 if (excl) 165 dma_fence_put(excl); 166 167 fobj = rcu_dereference_protected(obj->fence, 1); 168 dma_resv_list_free(fobj); 169 ww_mutex_destroy(&obj->lock); 170 } 171 EXPORT_SYMBOL(dma_resv_fini); 172 173 /** 174 * dma_resv_reserve_shared - Reserve space to add shared fences to 175 * a dma_resv. 176 * @obj: reservation object 177 * @num_fences: number of fences we want to add 178 * 179 * Should be called before dma_resv_add_shared_fence(). Must 180 * be called with obj->lock held. 181 * 182 * RETURNS 183 * Zero for success, or -errno 184 */ 185 int dma_resv_reserve_shared(struct dma_resv *obj, unsigned int num_fences) 186 { 187 struct dma_resv_list *old, *new; 188 unsigned int i, j, k, max; 189 190 dma_resv_assert_held(obj); 191 192 old = dma_resv_get_list(obj); 193 194 if (old && old->shared_max) { 195 if ((old->shared_count + num_fences) <= old->shared_max) 196 return 0; 197 else 198 max = max(old->shared_count + num_fences, 199 old->shared_max * 2); 200 } else { 201 max = 4; 202 } 203 204 new = dma_resv_list_alloc(max); 205 if (!new) 206 return -ENOMEM; 207 208 /* 209 * no need to bump fence refcounts, rcu_read access 210 * requires the use of kref_get_unless_zero, and the 211 * references from the old struct are carried over to 212 * the new. 213 */ 214 for (i = 0, j = 0, k = max; i < (old ? old->shared_count : 0); ++i) { 215 struct dma_fence *fence; 216 217 fence = rcu_dereference_protected(old->shared[i], 218 dma_resv_held(obj)); 219 if (dma_fence_is_signaled(fence)) 220 RCU_INIT_POINTER(new->shared[--k], fence); 221 else 222 RCU_INIT_POINTER(new->shared[j++], fence); 223 } 224 new->shared_count = j; 225 226 /* 227 * We are not changing the effective set of fences here so can 228 * merely update the pointer to the new array; both existing 229 * readers and new readers will see exactly the same set of 230 * active (unsignaled) shared fences. Individual fences and the 231 * old array are protected by RCU and so will not vanish under 232 * the gaze of the rcu_read_lock() readers. 233 */ 234 rcu_assign_pointer(obj->fence, new); 235 236 if (!old) 237 return 0; 238 239 /* Drop the references to the signaled fences */ 240 for (i = k; i < max; ++i) { 241 struct dma_fence *fence; 242 243 fence = rcu_dereference_protected(new->shared[i], 244 dma_resv_held(obj)); 245 dma_fence_put(fence); 246 } 247 kfree_rcu(old, rcu); 248 249 return 0; 250 } 251 EXPORT_SYMBOL(dma_resv_reserve_shared); 252 253 /** 254 * dma_resv_add_shared_fence - Add a fence to a shared slot 255 * @obj: the reservation object 256 * @fence: the shared fence to add 257 * 258 * Add a fence to a shared slot, obj->lock must be held, and 259 * dma_resv_reserve_shared() has been called. 260 */ 261 void dma_resv_add_shared_fence(struct dma_resv *obj, struct dma_fence *fence) 262 { 263 struct dma_resv_list *fobj; 264 struct dma_fence *old; 265 unsigned int i, count; 266 267 dma_fence_get(fence); 268 269 dma_resv_assert_held(obj); 270 271 fobj = dma_resv_get_list(obj); 272 count = fobj->shared_count; 273 274 preempt_disable(); 275 write_seqcount_begin(&obj->seq); 276 277 for (i = 0; i < count; ++i) { 278 279 old = rcu_dereference_protected(fobj->shared[i], 280 dma_resv_held(obj)); 281 if (old->context == fence->context || 282 dma_fence_is_signaled(old)) 283 goto replace; 284 } 285 286 BUG_ON(fobj->shared_count >= fobj->shared_max); 287 old = NULL; 288 count++; 289 290 replace: 291 RCU_INIT_POINTER(fobj->shared[i], fence); 292 /* pointer update must be visible before we extend the shared_count */ 293 smp_store_mb(fobj->shared_count, count); 294 295 write_seqcount_end(&obj->seq); 296 preempt_enable(); 297 dma_fence_put(old); 298 } 299 EXPORT_SYMBOL(dma_resv_add_shared_fence); 300 301 /** 302 * dma_resv_add_excl_fence - Add an exclusive fence. 303 * @obj: the reservation object 304 * @fence: the shared fence to add 305 * 306 * Add a fence to the exclusive slot. The obj->lock must be held. 307 */ 308 void dma_resv_add_excl_fence(struct dma_resv *obj, struct dma_fence *fence) 309 { 310 struct dma_fence *old_fence = dma_resv_get_excl(obj); 311 struct dma_resv_list *old; 312 u32 i = 0; 313 314 dma_resv_assert_held(obj); 315 316 old = dma_resv_get_list(obj); 317 if (old) 318 i = old->shared_count; 319 320 if (fence) 321 dma_fence_get(fence); 322 323 preempt_disable(); 324 write_seqcount_begin(&obj->seq); 325 /* write_seqcount_begin provides the necessary memory barrier */ 326 RCU_INIT_POINTER(obj->fence_excl, fence); 327 if (old) 328 old->shared_count = 0; 329 write_seqcount_end(&obj->seq); 330 preempt_enable(); 331 332 /* inplace update, no shared fences */ 333 while (i--) 334 dma_fence_put(rcu_dereference_protected(old->shared[i], 335 dma_resv_held(obj))); 336 337 dma_fence_put(old_fence); 338 } 339 EXPORT_SYMBOL(dma_resv_add_excl_fence); 340 341 /** 342 * dma_resv_copy_fences - Copy all fences from src to dst. 343 * @dst: the destination reservation object 344 * @src: the source reservation object 345 * 346 * Copy all fences from src to dst. dst-lock must be held. 347 */ 348 int dma_resv_copy_fences(struct dma_resv *dst, struct dma_resv *src) 349 { 350 struct dma_resv_list *src_list, *dst_list; 351 struct dma_fence *old, *new; 352 unsigned i; 353 354 dma_resv_assert_held(dst); 355 356 rcu_read_lock(); 357 src_list = rcu_dereference(src->fence); 358 359 retry: 360 if (src_list) { 361 unsigned shared_count = src_list->shared_count; 362 363 rcu_read_unlock(); 364 365 dst_list = dma_resv_list_alloc(shared_count); 366 if (!dst_list) 367 return -ENOMEM; 368 369 rcu_read_lock(); 370 src_list = rcu_dereference(src->fence); 371 if (!src_list || src_list->shared_count > shared_count) { 372 kfree(dst_list); 373 goto retry; 374 } 375 376 dst_list->shared_count = 0; 377 for (i = 0; i < src_list->shared_count; ++i) { 378 struct dma_fence *fence; 379 380 fence = rcu_dereference(src_list->shared[i]); 381 if (test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, 382 &fence->flags)) 383 continue; 384 385 if (!dma_fence_get_rcu(fence)) { 386 dma_resv_list_free(dst_list); 387 src_list = rcu_dereference(src->fence); 388 goto retry; 389 } 390 391 if (dma_fence_is_signaled(fence)) { 392 dma_fence_put(fence); 393 continue; 394 } 395 396 rcu_assign_pointer(dst_list->shared[dst_list->shared_count++], fence); 397 } 398 } else { 399 dst_list = NULL; 400 } 401 402 new = dma_fence_get_rcu_safe(&src->fence_excl); 403 rcu_read_unlock(); 404 405 src_list = dma_resv_get_list(dst); 406 old = dma_resv_get_excl(dst); 407 408 preempt_disable(); 409 write_seqcount_begin(&dst->seq); 410 /* write_seqcount_begin provides the necessary memory barrier */ 411 RCU_INIT_POINTER(dst->fence_excl, new); 412 RCU_INIT_POINTER(dst->fence, dst_list); 413 write_seqcount_end(&dst->seq); 414 preempt_enable(); 415 416 dma_resv_list_free(src_list); 417 dma_fence_put(old); 418 419 return 0; 420 } 421 EXPORT_SYMBOL(dma_resv_copy_fences); 422 423 /** 424 * dma_resv_get_fences_rcu - Get an object's shared and exclusive 425 * fences without update side lock held 426 * @obj: the reservation object 427 * @pfence_excl: the returned exclusive fence (or NULL) 428 * @pshared_count: the number of shared fences returned 429 * @pshared: the array of shared fence ptrs returned (array is krealloc'd to 430 * the required size, and must be freed by caller) 431 * 432 * Retrieve all fences from the reservation object. If the pointer for the 433 * exclusive fence is not specified the fence is put into the array of the 434 * shared fences as well. Returns either zero or -ENOMEM. 435 */ 436 int dma_resv_get_fences_rcu(struct dma_resv *obj, 437 struct dma_fence **pfence_excl, 438 unsigned *pshared_count, 439 struct dma_fence ***pshared) 440 { 441 struct dma_fence **shared = NULL; 442 struct dma_fence *fence_excl; 443 unsigned int shared_count; 444 int ret = 1; 445 446 do { 447 struct dma_resv_list *fobj; 448 unsigned int i, seq; 449 size_t sz = 0; 450 451 shared_count = i = 0; 452 453 rcu_read_lock(); 454 seq = read_seqcount_begin(&obj->seq); 455 456 fence_excl = rcu_dereference(obj->fence_excl); 457 if (fence_excl && !dma_fence_get_rcu(fence_excl)) 458 goto unlock; 459 460 fobj = rcu_dereference(obj->fence); 461 if (fobj) 462 sz += sizeof(*shared) * fobj->shared_max; 463 464 if (!pfence_excl && fence_excl) 465 sz += sizeof(*shared); 466 467 if (sz) { 468 struct dma_fence **nshared; 469 470 #ifdef __linux__ 471 nshared = krealloc(shared, sz, 472 GFP_NOWAIT | __GFP_NOWARN); 473 #else 474 nshared = kmalloc(sz, GFP_NOWAIT | __GFP_NOWARN); 475 if (nshared != NULL && shared != NULL) 476 memcpy(nshared, shared, sz); 477 kfree(shared); 478 #endif 479 if (!nshared) { 480 rcu_read_unlock(); 481 482 dma_fence_put(fence_excl); 483 fence_excl = NULL; 484 485 #ifdef __linux__ 486 nshared = krealloc(shared, sz, GFP_KERNEL); 487 #else 488 nshared = kmalloc(sz, GFP_KERNEL); 489 if (nshared != NULL && shared != NULL) 490 memcpy(nshared, shared, sz); 491 kfree(shared); 492 #endif 493 if (nshared) { 494 shared = nshared; 495 continue; 496 } 497 498 ret = -ENOMEM; 499 break; 500 } 501 shared = nshared; 502 shared_count = fobj ? fobj->shared_count : 0; 503 for (i = 0; i < shared_count; ++i) { 504 shared[i] = rcu_dereference(fobj->shared[i]); 505 if (!dma_fence_get_rcu(shared[i])) 506 break; 507 } 508 } 509 510 if (i != shared_count || read_seqcount_retry(&obj->seq, seq)) { 511 while (i--) 512 dma_fence_put(shared[i]); 513 dma_fence_put(fence_excl); 514 goto unlock; 515 } 516 517 ret = 0; 518 unlock: 519 rcu_read_unlock(); 520 } while (ret); 521 522 if (pfence_excl) 523 *pfence_excl = fence_excl; 524 else if (fence_excl) 525 shared[shared_count++] = fence_excl; 526 527 if (!shared_count) { 528 kfree(shared); 529 shared = NULL; 530 } 531 532 *pshared_count = shared_count; 533 *pshared = shared; 534 return ret; 535 } 536 EXPORT_SYMBOL_GPL(dma_resv_get_fences_rcu); 537 538 /** 539 * dma_resv_wait_timeout_rcu - Wait on reservation's objects 540 * shared and/or exclusive fences. 541 * @obj: the reservation object 542 * @wait_all: if true, wait on all fences, else wait on just exclusive fence 543 * @intr: if true, do interruptible wait 544 * @timeout: timeout value in jiffies or zero to return immediately 545 * 546 * RETURNS 547 * Returns -ERESTARTSYS if interrupted, 0 if the wait timed out, or 548 * greater than zer on success. 549 */ 550 long dma_resv_wait_timeout_rcu(struct dma_resv *obj, 551 bool wait_all, bool intr, 552 unsigned long timeout) 553 { 554 struct dma_fence *fence; 555 unsigned seq, shared_count; 556 long ret = timeout ? timeout : 1; 557 int i; 558 559 retry: 560 shared_count = 0; 561 seq = read_seqcount_begin(&obj->seq); 562 rcu_read_lock(); 563 i = -1; 564 565 fence = rcu_dereference(obj->fence_excl); 566 if (fence && !test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &fence->flags)) { 567 if (!dma_fence_get_rcu(fence)) 568 goto unlock_retry; 569 570 if (dma_fence_is_signaled(fence)) { 571 dma_fence_put(fence); 572 fence = NULL; 573 } 574 575 } else { 576 fence = NULL; 577 } 578 579 if (wait_all) { 580 struct dma_resv_list *fobj = rcu_dereference(obj->fence); 581 582 if (fobj) 583 shared_count = fobj->shared_count; 584 585 for (i = 0; !fence && i < shared_count; ++i) { 586 struct dma_fence *lfence = rcu_dereference(fobj->shared[i]); 587 588 if (test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, 589 &lfence->flags)) 590 continue; 591 592 if (!dma_fence_get_rcu(lfence)) 593 goto unlock_retry; 594 595 if (dma_fence_is_signaled(lfence)) { 596 dma_fence_put(lfence); 597 continue; 598 } 599 600 fence = lfence; 601 break; 602 } 603 } 604 605 rcu_read_unlock(); 606 if (fence) { 607 if (read_seqcount_retry(&obj->seq, seq)) { 608 dma_fence_put(fence); 609 goto retry; 610 } 611 612 ret = dma_fence_wait_timeout(fence, intr, ret); 613 dma_fence_put(fence); 614 if (ret > 0 && wait_all && (i + 1 < shared_count)) 615 goto retry; 616 } 617 return ret; 618 619 unlock_retry: 620 rcu_read_unlock(); 621 goto retry; 622 } 623 EXPORT_SYMBOL_GPL(dma_resv_wait_timeout_rcu); 624 625 626 static inline int dma_resv_test_signaled_single(struct dma_fence *passed_fence) 627 { 628 struct dma_fence *fence, *lfence = passed_fence; 629 int ret = 1; 630 631 if (!test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &lfence->flags)) { 632 fence = dma_fence_get_rcu(lfence); 633 if (!fence) 634 return -1; 635 636 ret = !!dma_fence_is_signaled(fence); 637 dma_fence_put(fence); 638 } 639 return ret; 640 } 641 642 /** 643 * dma_resv_test_signaled_rcu - Test if a reservation object's 644 * fences have been signaled. 645 * @obj: the reservation object 646 * @test_all: if true, test all fences, otherwise only test the exclusive 647 * fence 648 * 649 * RETURNS 650 * true if all fences signaled, else false 651 */ 652 bool dma_resv_test_signaled_rcu(struct dma_resv *obj, bool test_all) 653 { 654 unsigned seq, shared_count; 655 int ret; 656 657 rcu_read_lock(); 658 retry: 659 ret = true; 660 shared_count = 0; 661 seq = read_seqcount_begin(&obj->seq); 662 663 if (test_all) { 664 unsigned i; 665 666 struct dma_resv_list *fobj = rcu_dereference(obj->fence); 667 668 if (fobj) 669 shared_count = fobj->shared_count; 670 671 for (i = 0; i < shared_count; ++i) { 672 struct dma_fence *fence = rcu_dereference(fobj->shared[i]); 673 674 ret = dma_resv_test_signaled_single(fence); 675 if (ret < 0) 676 goto retry; 677 else if (!ret) 678 break; 679 } 680 681 if (read_seqcount_retry(&obj->seq, seq)) 682 goto retry; 683 } 684 685 if (!shared_count) { 686 struct dma_fence *fence_excl = rcu_dereference(obj->fence_excl); 687 688 if (fence_excl) { 689 ret = dma_resv_test_signaled_single(fence_excl); 690 if (ret < 0) 691 goto retry; 692 693 if (read_seqcount_retry(&obj->seq, seq)) 694 goto retry; 695 } 696 } 697 698 rcu_read_unlock(); 699 return ret; 700 } 701 EXPORT_SYMBOL_GPL(dma_resv_test_signaled_rcu); 702