1 /**************************************************************************
2  *
3  * Copyright 2007-2010 VMware, Inc.
4  * All Rights Reserved.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the
8  * "Software"), to deal in the Software without restriction, including
9  * without limitation the rights to use, copy, modify, merge, publish,
10  * distribute, sub license, and/or sell copies of the Software, and to
11  * permit persons to whom the Software is furnished to do so, subject to
12  * the following conditions:
13  *
14  * The above copyright notice and this permission notice (including the
15  * next paragraph) shall be included in all copies or substantial portions
16  * of the Software.
17  *
18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21  * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25  *
26  **************************************************************************/
27 
28 /**
29  * \file
30  * Implementation of fenced buffers.
31  *
32  * \author Jose Fonseca <jfonseca-at-vmware-dot-com>
33  * \author Thomas Hellström <thellstrom-at-vmware-dot-com>
34  */
35 
36 
37 #include "pipe/p_config.h"
38 
39 #if defined(PIPE_OS_LINUX) || defined(PIPE_OS_BSD) || defined(PIPE_OS_SOLARIS)
40 #include <unistd.h>
41 #include <sched.h>
42 #endif
43 #include <inttypes.h>
44 
45 #include "pipe/p_compiler.h"
46 #include "pipe/p_defines.h"
47 #include "util/u_debug.h"
48 #include "os/os_thread.h"
49 #include "util/u_memory.h"
50 #include "util/list.h"
51 
52 #include "pb_buffer.h"
53 #include "pb_buffer_fenced.h"
54 #include "pb_bufmgr.h"
55 
56 
57 
58 /**
59  * Convenience macro (type safe).
60  */
61 #define SUPER(__derived) (&(__derived)->base)
62 
63 
64 struct fenced_manager
65 {
66    struct pb_manager base;
67    struct pb_manager *provider;
68    struct pb_fence_ops *ops;
69 
70    /**
71     * Maximum buffer size that can be safely allocated.
72     */
73    pb_size max_buffer_size;
74 
75    /**
76     * Maximum cpu memory we can allocate before we start waiting for the
77     * GPU to idle.
78     */
79    pb_size max_cpu_total_size;
80 
81    /**
82     * Following members are mutable and protected by this mutex.
83     */
84    mtx_t mutex;
85 
86    /**
87     * Fenced buffer list.
88     *
89     * All fenced buffers are placed in this listed, ordered from the oldest
90     * fence to the newest fence.
91     */
92    struct list_head fenced;
93    pb_size num_fenced;
94 
95    struct list_head unfenced;
96    pb_size num_unfenced;
97 
98    /**
99     * How much temporary CPU memory is being used to hold unvalidated buffers.
100     */
101    pb_size cpu_total_size;
102 };
103 
104 
105 /**
106  * Fenced buffer.
107  *
108  * Wrapper around a pipe buffer which adds fencing and reference counting.
109  */
110 struct fenced_buffer
111 {
112    /**
113     * Immutable members.
114     */
115 
116    struct pb_buffer base;
117    struct fenced_manager *mgr;
118 
119    /**
120     * Following members are mutable and protected by fenced_manager::mutex.
121     */
122 
123    struct list_head head;
124 
125    /**
126     * Buffer with storage.
127     */
128    struct pb_buffer *buffer;
129    pb_size size;
130    struct pb_desc desc;
131 
132    /**
133     * Temporary CPU storage data. Used when there isn't enough GPU memory to
134     * store the buffer.
135     */
136    void *data;
137 
138    /**
139     * A bitmask of PB_USAGE_CPU/GPU_READ/WRITE describing the current
140     * buffer usage.
141     */
142    unsigned flags;
143 
144    unsigned mapcount;
145 
146    struct pb_validate *vl;
147    unsigned validation_flags;
148 
149    struct pipe_fence_handle *fence;
150 };
151 
152 
153 static inline struct fenced_manager *
fenced_manager(struct pb_manager * mgr)154 fenced_manager(struct pb_manager *mgr)
155 {
156    assert(mgr);
157    return (struct fenced_manager *)mgr;
158 }
159 
160 
161 static inline struct fenced_buffer *
fenced_buffer(struct pb_buffer * buf)162 fenced_buffer(struct pb_buffer *buf)
163 {
164    assert(buf);
165    return (struct fenced_buffer *)buf;
166 }
167 
168 
169 static void
170 fenced_buffer_destroy_cpu_storage_locked(struct fenced_buffer *fenced_buf);
171 
172 static enum pipe_error
173 fenced_buffer_create_cpu_storage_locked(struct fenced_manager *fenced_mgr,
174                                         struct fenced_buffer *fenced_buf);
175 
176 static void
177 fenced_buffer_destroy_gpu_storage_locked(struct fenced_buffer *fenced_buf);
178 
179 static enum pipe_error
180 fenced_buffer_create_gpu_storage_locked(struct fenced_manager *fenced_mgr,
181                                         struct fenced_buffer *fenced_buf,
182                                         boolean wait);
183 
184 static enum pipe_error
185 fenced_buffer_copy_storage_to_gpu_locked(struct fenced_buffer *fenced_buf);
186 
187 static enum pipe_error
188 fenced_buffer_copy_storage_to_cpu_locked(struct fenced_buffer *fenced_buf);
189 
190 
191 /**
192  * Dump the fenced buffer list.
193  *
194  * Useful to understand failures to allocate buffers.
195  */
196 static void
fenced_manager_dump_locked(struct fenced_manager * fenced_mgr)197 fenced_manager_dump_locked(struct fenced_manager *fenced_mgr)
198 {
199 #ifdef DEBUG
200    struct pb_fence_ops *ops = fenced_mgr->ops;
201    struct list_head *curr, *next;
202    struct fenced_buffer *fenced_buf;
203 
204    debug_printf("%10s %7s %8s %7s %10s %s\n",
205                 "buffer", "size", "refcount", "storage", "fence", "signalled");
206 
207    curr = fenced_mgr->unfenced.next;
208    next = curr->next;
209    while (curr != &fenced_mgr->unfenced) {
210       fenced_buf = LIST_ENTRY(struct fenced_buffer, curr, head);
211       assert(!fenced_buf->fence);
212       debug_printf("%10p %"PRIu64" %8u %7s\n",
213                    (void *) fenced_buf,
214                    fenced_buf->base.size,
215                    p_atomic_read(&fenced_buf->base.reference.count),
216                    fenced_buf->buffer ? "gpu" : (fenced_buf->data ? "cpu" : "none"));
217       curr = next;
218       next = curr->next;
219    }
220 
221    curr = fenced_mgr->fenced.next;
222    next = curr->next;
223    while (curr != &fenced_mgr->fenced) {
224       int signaled;
225       fenced_buf = LIST_ENTRY(struct fenced_buffer, curr, head);
226       assert(fenced_buf->buffer);
227       signaled = ops->fence_signalled(ops, fenced_buf->fence, 0);
228       debug_printf("%10p %"PRIu64" %8u %7s %10p %s\n",
229                    (void *) fenced_buf,
230                    fenced_buf->base.size,
231                    p_atomic_read(&fenced_buf->base.reference.count),
232                    "gpu",
233                    (void *) fenced_buf->fence,
234                    signaled == 0 ? "y" : "n");
235       curr = next;
236       next = curr->next;
237    }
238 #else
239    (void)fenced_mgr;
240 #endif
241 }
242 
243 
244 static inline void
fenced_buffer_destroy_locked(struct fenced_manager * fenced_mgr,struct fenced_buffer * fenced_buf)245 fenced_buffer_destroy_locked(struct fenced_manager *fenced_mgr,
246                              struct fenced_buffer *fenced_buf)
247 {
248    assert(!pipe_is_referenced(&fenced_buf->base.reference));
249 
250    assert(!fenced_buf->fence);
251    assert(fenced_buf->head.prev);
252    assert(fenced_buf->head.next);
253    LIST_DEL(&fenced_buf->head);
254    assert(fenced_mgr->num_unfenced);
255    --fenced_mgr->num_unfenced;
256 
257    fenced_buffer_destroy_gpu_storage_locked(fenced_buf);
258    fenced_buffer_destroy_cpu_storage_locked(fenced_buf);
259 
260    FREE(fenced_buf);
261 }
262 
263 
264 /**
265  * Add the buffer to the fenced list.
266  *
267  * Reference count should be incremented before calling this function.
268  */
269 static inline void
fenced_buffer_add_locked(struct fenced_manager * fenced_mgr,struct fenced_buffer * fenced_buf)270 fenced_buffer_add_locked(struct fenced_manager *fenced_mgr,
271                          struct fenced_buffer *fenced_buf)
272 {
273    assert(pipe_is_referenced(&fenced_buf->base.reference));
274    assert(fenced_buf->flags & PB_USAGE_GPU_READ_WRITE);
275    assert(fenced_buf->fence);
276 
277    p_atomic_inc(&fenced_buf->base.reference.count);
278 
279    LIST_DEL(&fenced_buf->head);
280    assert(fenced_mgr->num_unfenced);
281    --fenced_mgr->num_unfenced;
282    LIST_ADDTAIL(&fenced_buf->head, &fenced_mgr->fenced);
283    ++fenced_mgr->num_fenced;
284 }
285 
286 
287 /**
288  * Remove the buffer from the fenced list, and potentially destroy the buffer
289  * if the reference count reaches zero.
290  *
291  * Returns TRUE if the buffer was detroyed.
292  */
293 static inline boolean
fenced_buffer_remove_locked(struct fenced_manager * fenced_mgr,struct fenced_buffer * fenced_buf)294 fenced_buffer_remove_locked(struct fenced_manager *fenced_mgr,
295                             struct fenced_buffer *fenced_buf)
296 {
297    struct pb_fence_ops *ops = fenced_mgr->ops;
298 
299    assert(fenced_buf->fence);
300    assert(fenced_buf->mgr == fenced_mgr);
301 
302    ops->fence_reference(ops, &fenced_buf->fence, NULL);
303    fenced_buf->flags &= ~PB_USAGE_GPU_READ_WRITE;
304 
305    assert(fenced_buf->head.prev);
306    assert(fenced_buf->head.next);
307 
308    LIST_DEL(&fenced_buf->head);
309    assert(fenced_mgr->num_fenced);
310    --fenced_mgr->num_fenced;
311 
312    LIST_ADDTAIL(&fenced_buf->head, &fenced_mgr->unfenced);
313    ++fenced_mgr->num_unfenced;
314 
315    if (p_atomic_dec_zero(&fenced_buf->base.reference.count)) {
316       fenced_buffer_destroy_locked(fenced_mgr, fenced_buf);
317       return TRUE;
318    }
319 
320    return FALSE;
321 }
322 
323 
324 /**
325  * Wait for the fence to expire, and remove it from the fenced list.
326  *
327  * This function will release and re-acquire the mutex, so any copy of mutable
328  * state must be discarded after calling it.
329  */
330 static inline enum pipe_error
fenced_buffer_finish_locked(struct fenced_manager * fenced_mgr,struct fenced_buffer * fenced_buf)331 fenced_buffer_finish_locked(struct fenced_manager *fenced_mgr,
332                             struct fenced_buffer *fenced_buf)
333 {
334    struct pb_fence_ops *ops = fenced_mgr->ops;
335    enum pipe_error ret = PIPE_ERROR;
336 
337 #if 0
338    debug_warning("waiting for GPU");
339 #endif
340 
341    assert(pipe_is_referenced(&fenced_buf->base.reference));
342    assert(fenced_buf->fence);
343 
344    if (fenced_buf->fence) {
345       struct pipe_fence_handle *fence = NULL;
346       int finished;
347       boolean proceed;
348 
349       ops->fence_reference(ops, &fence, fenced_buf->fence);
350 
351       mtx_unlock(&fenced_mgr->mutex);
352 
353       finished = ops->fence_finish(ops, fenced_buf->fence, 0);
354 
355       mtx_lock(&fenced_mgr->mutex);
356 
357       assert(pipe_is_referenced(&fenced_buf->base.reference));
358 
359       /* Only proceed if the fence object didn't change in the meanwhile.
360        * Otherwise assume the work has been already carried out by another
361        * thread that re-aquired the lock before us.
362        */
363       proceed = fence == fenced_buf->fence ? TRUE : FALSE;
364 
365       ops->fence_reference(ops, &fence, NULL);
366 
367       if (proceed && finished == 0) {
368          /* Remove from the fenced list. */
369          boolean destroyed = fenced_buffer_remove_locked(fenced_mgr, fenced_buf);
370 
371          /* TODO: remove consequents buffers with the same fence? */
372 
373          assert(!destroyed);
374          (void) destroyed; /* silence unused var warning for non-debug build */
375 
376          fenced_buf->flags &= ~PB_USAGE_GPU_READ_WRITE;
377 
378          ret = PIPE_OK;
379       }
380    }
381 
382    return ret;
383 }
384 
385 
386 /**
387  * Remove as many fenced buffers from the fenced list as possible.
388  *
389  * Returns TRUE if at least one buffer was removed.
390  */
391 static boolean
fenced_manager_check_signalled_locked(struct fenced_manager * fenced_mgr,boolean wait)392 fenced_manager_check_signalled_locked(struct fenced_manager *fenced_mgr,
393                                       boolean wait)
394 {
395    struct pb_fence_ops *ops = fenced_mgr->ops;
396    struct list_head *curr, *next;
397    struct fenced_buffer *fenced_buf;
398    struct pipe_fence_handle *prev_fence = NULL;
399    boolean ret = FALSE;
400 
401    curr = fenced_mgr->fenced.next;
402    next = curr->next;
403    while (curr != &fenced_mgr->fenced) {
404       fenced_buf = LIST_ENTRY(struct fenced_buffer, curr, head);
405 
406       if (fenced_buf->fence != prev_fence) {
407          int signaled;
408 
409          if (wait) {
410             signaled = ops->fence_finish(ops, fenced_buf->fence, 0);
411 
412             /* Don't return just now. Instead preemptively check if the
413              * following buffers' fences already expired, without further waits.
414              */
415             wait = FALSE;
416          } else {
417             signaled = ops->fence_signalled(ops, fenced_buf->fence, 0);
418          }
419 
420          if (signaled != 0) {
421             return ret;
422          }
423 
424          prev_fence = fenced_buf->fence;
425       } else {
426          /* This buffer's fence object is identical to the previous buffer's
427           * fence object, so no need to check the fence again.
428           */
429          assert(ops->fence_signalled(ops, fenced_buf->fence, 0) == 0);
430       }
431 
432       fenced_buffer_remove_locked(fenced_mgr, fenced_buf);
433 
434       ret = TRUE;
435 
436       curr = next;
437       next = curr->next;
438    }
439 
440    return ret;
441 }
442 
443 
444 /**
445  * Try to free some GPU memory by backing it up into CPU memory.
446  *
447  * Returns TRUE if at least one buffer was freed.
448  */
449 static boolean
fenced_manager_free_gpu_storage_locked(struct fenced_manager * fenced_mgr)450 fenced_manager_free_gpu_storage_locked(struct fenced_manager *fenced_mgr)
451 {
452    struct list_head *curr, *next;
453    struct fenced_buffer *fenced_buf;
454 
455    curr = fenced_mgr->unfenced.next;
456    next = curr->next;
457    while (curr != &fenced_mgr->unfenced) {
458       fenced_buf = LIST_ENTRY(struct fenced_buffer, curr, head);
459 
460       /* We can only move storage if the buffer is not mapped and not
461        * validated.
462        */
463       if (fenced_buf->buffer &&
464          !fenced_buf->mapcount &&
465          !fenced_buf->vl) {
466          enum pipe_error ret;
467 
468          ret = fenced_buffer_create_cpu_storage_locked(fenced_mgr, fenced_buf);
469          if (ret == PIPE_OK) {
470             ret = fenced_buffer_copy_storage_to_cpu_locked(fenced_buf);
471             if (ret == PIPE_OK) {
472                fenced_buffer_destroy_gpu_storage_locked(fenced_buf);
473                return TRUE;
474             }
475             fenced_buffer_destroy_cpu_storage_locked(fenced_buf);
476          }
477       }
478 
479       curr = next;
480       next = curr->next;
481    }
482 
483    return FALSE;
484 }
485 
486 
487 /**
488  * Destroy CPU storage for this buffer.
489  */
490 static void
fenced_buffer_destroy_cpu_storage_locked(struct fenced_buffer * fenced_buf)491 fenced_buffer_destroy_cpu_storage_locked(struct fenced_buffer *fenced_buf)
492 {
493    if (fenced_buf->data) {
494       align_free(fenced_buf->data);
495       fenced_buf->data = NULL;
496       assert(fenced_buf->mgr->cpu_total_size >= fenced_buf->size);
497       fenced_buf->mgr->cpu_total_size -= fenced_buf->size;
498    }
499 }
500 
501 
502 /**
503  * Create CPU storage for this buffer.
504  */
505 static enum pipe_error
fenced_buffer_create_cpu_storage_locked(struct fenced_manager * fenced_mgr,struct fenced_buffer * fenced_buf)506 fenced_buffer_create_cpu_storage_locked(struct fenced_manager *fenced_mgr,
507                                         struct fenced_buffer *fenced_buf)
508 {
509    assert(!fenced_buf->data);
510    if (fenced_buf->data)
511       return PIPE_OK;
512 
513    if (fenced_mgr->cpu_total_size + fenced_buf->size > fenced_mgr->max_cpu_total_size)
514       return PIPE_ERROR_OUT_OF_MEMORY;
515 
516    fenced_buf->data = align_malloc(fenced_buf->size, fenced_buf->desc.alignment);
517    if (!fenced_buf->data)
518       return PIPE_ERROR_OUT_OF_MEMORY;
519 
520    fenced_mgr->cpu_total_size += fenced_buf->size;
521 
522    return PIPE_OK;
523 }
524 
525 
526 /**
527  * Destroy the GPU storage.
528  */
529 static void
fenced_buffer_destroy_gpu_storage_locked(struct fenced_buffer * fenced_buf)530 fenced_buffer_destroy_gpu_storage_locked(struct fenced_buffer *fenced_buf)
531 {
532    if (fenced_buf->buffer) {
533       pb_reference(&fenced_buf->buffer, NULL);
534    }
535 }
536 
537 
538 /**
539  * Try to create GPU storage for this buffer.
540  *
541  * This function is a shorthand around pb_manager::create_buffer for
542  * fenced_buffer_create_gpu_storage_locked()'s benefit.
543  */
544 static inline boolean
fenced_buffer_try_create_gpu_storage_locked(struct fenced_manager * fenced_mgr,struct fenced_buffer * fenced_buf)545 fenced_buffer_try_create_gpu_storage_locked(struct fenced_manager *fenced_mgr,
546                                             struct fenced_buffer *fenced_buf)
547 {
548    struct pb_manager *provider = fenced_mgr->provider;
549 
550    assert(!fenced_buf->buffer);
551 
552    fenced_buf->buffer = provider->create_buffer(fenced_mgr->provider,
553                                                 fenced_buf->size,
554                                                 &fenced_buf->desc);
555    return fenced_buf->buffer ? TRUE : FALSE;
556 }
557 
558 
559 /**
560  * Create GPU storage for this buffer.
561  */
562 static enum pipe_error
fenced_buffer_create_gpu_storage_locked(struct fenced_manager * fenced_mgr,struct fenced_buffer * fenced_buf,boolean wait)563 fenced_buffer_create_gpu_storage_locked(struct fenced_manager *fenced_mgr,
564                                         struct fenced_buffer *fenced_buf,
565                                         boolean wait)
566 {
567    assert(!fenced_buf->buffer);
568 
569    /* Check for signaled buffers before trying to allocate. */
570    fenced_manager_check_signalled_locked(fenced_mgr, FALSE);
571 
572    fenced_buffer_try_create_gpu_storage_locked(fenced_mgr, fenced_buf);
573 
574    /* Keep trying while there is some sort of progress:
575     * - fences are expiring,
576     * - or buffers are being being swapped out from GPU memory into CPU memory.
577     */
578    while (!fenced_buf->buffer &&
579          (fenced_manager_check_signalled_locked(fenced_mgr, FALSE) ||
580           fenced_manager_free_gpu_storage_locked(fenced_mgr))) {
581       fenced_buffer_try_create_gpu_storage_locked(fenced_mgr, fenced_buf);
582    }
583 
584    if (!fenced_buf->buffer && wait) {
585       /* Same as before, but this time around, wait to free buffers if
586        * necessary.
587        */
588       while (!fenced_buf->buffer &&
589             (fenced_manager_check_signalled_locked(fenced_mgr, TRUE) ||
590              fenced_manager_free_gpu_storage_locked(fenced_mgr))) {
591          fenced_buffer_try_create_gpu_storage_locked(fenced_mgr, fenced_buf);
592       }
593    }
594 
595    if (!fenced_buf->buffer) {
596       if (0)
597          fenced_manager_dump_locked(fenced_mgr);
598 
599       /* Give up. */
600       return PIPE_ERROR_OUT_OF_MEMORY;
601    }
602 
603    return PIPE_OK;
604 }
605 
606 
607 static enum pipe_error
fenced_buffer_copy_storage_to_gpu_locked(struct fenced_buffer * fenced_buf)608 fenced_buffer_copy_storage_to_gpu_locked(struct fenced_buffer *fenced_buf)
609 {
610    uint8_t *map;
611 
612    assert(fenced_buf->data);
613    assert(fenced_buf->buffer);
614 
615    map = pb_map(fenced_buf->buffer, PB_USAGE_CPU_WRITE, NULL);
616    if (!map)
617       return PIPE_ERROR;
618 
619    memcpy(map, fenced_buf->data, fenced_buf->size);
620 
621    pb_unmap(fenced_buf->buffer);
622 
623    return PIPE_OK;
624 }
625 
626 
627 static enum pipe_error
fenced_buffer_copy_storage_to_cpu_locked(struct fenced_buffer * fenced_buf)628 fenced_buffer_copy_storage_to_cpu_locked(struct fenced_buffer *fenced_buf)
629 {
630    const uint8_t *map;
631 
632    assert(fenced_buf->data);
633    assert(fenced_buf->buffer);
634 
635    map = pb_map(fenced_buf->buffer, PB_USAGE_CPU_READ, NULL);
636    if (!map)
637       return PIPE_ERROR;
638 
639    memcpy(fenced_buf->data, map, fenced_buf->size);
640 
641    pb_unmap(fenced_buf->buffer);
642 
643    return PIPE_OK;
644 }
645 
646 
647 static void
fenced_buffer_destroy(struct pb_buffer * buf)648 fenced_buffer_destroy(struct pb_buffer *buf)
649 {
650    struct fenced_buffer *fenced_buf = fenced_buffer(buf);
651    struct fenced_manager *fenced_mgr = fenced_buf->mgr;
652 
653    assert(!pipe_is_referenced(&fenced_buf->base.reference));
654 
655    mtx_lock(&fenced_mgr->mutex);
656 
657    fenced_buffer_destroy_locked(fenced_mgr, fenced_buf);
658 
659    mtx_unlock(&fenced_mgr->mutex);
660 }
661 
662 
663 static void *
fenced_buffer_map(struct pb_buffer * buf,unsigned flags,void * flush_ctx)664 fenced_buffer_map(struct pb_buffer *buf,
665                   unsigned flags, void *flush_ctx)
666 {
667    struct fenced_buffer *fenced_buf = fenced_buffer(buf);
668    struct fenced_manager *fenced_mgr = fenced_buf->mgr;
669    struct pb_fence_ops *ops = fenced_mgr->ops;
670    void *map = NULL;
671 
672    mtx_lock(&fenced_mgr->mutex);
673 
674    assert(!(flags & PB_USAGE_GPU_READ_WRITE));
675 
676    /* Serialize writes. */
677    while ((fenced_buf->flags & PB_USAGE_GPU_WRITE) ||
678          ((fenced_buf->flags & PB_USAGE_GPU_READ) &&
679           (flags & PB_USAGE_CPU_WRITE))) {
680 
681       /* Don't wait for the GPU to finish accessing it,
682        * if blocking is forbidden.
683        */
684       if ((flags & PB_USAGE_DONTBLOCK) &&
685          ops->fence_signalled(ops, fenced_buf->fence, 0) != 0) {
686          goto done;
687       }
688 
689       if (flags & PB_USAGE_UNSYNCHRONIZED) {
690          break;
691       }
692 
693       /* Wait for the GPU to finish accessing. This will release and re-acquire
694        * the mutex, so all copies of mutable state must be discarded.
695        */
696       fenced_buffer_finish_locked(fenced_mgr, fenced_buf);
697    }
698 
699    if (fenced_buf->buffer) {
700       map = pb_map(fenced_buf->buffer, flags, flush_ctx);
701    } else {
702       assert(fenced_buf->data);
703       map = fenced_buf->data;
704    }
705 
706    if (map) {
707       ++fenced_buf->mapcount;
708       fenced_buf->flags |= flags & PB_USAGE_CPU_READ_WRITE;
709    }
710 
711  done:
712    mtx_unlock(&fenced_mgr->mutex);
713 
714    return map;
715 }
716 
717 
718 static void
fenced_buffer_unmap(struct pb_buffer * buf)719 fenced_buffer_unmap(struct pb_buffer *buf)
720 {
721    struct fenced_buffer *fenced_buf = fenced_buffer(buf);
722    struct fenced_manager *fenced_mgr = fenced_buf->mgr;
723 
724    mtx_lock(&fenced_mgr->mutex);
725 
726    assert(fenced_buf->mapcount);
727    if (fenced_buf->mapcount) {
728       if (fenced_buf->buffer)
729          pb_unmap(fenced_buf->buffer);
730       --fenced_buf->mapcount;
731       if (!fenced_buf->mapcount)
732          fenced_buf->flags &= ~PB_USAGE_CPU_READ_WRITE;
733    }
734 
735    mtx_unlock(&fenced_mgr->mutex);
736 }
737 
738 
739 static enum pipe_error
fenced_buffer_validate(struct pb_buffer * buf,struct pb_validate * vl,unsigned flags)740 fenced_buffer_validate(struct pb_buffer *buf,
741                        struct pb_validate *vl,
742                        unsigned flags)
743 {
744    struct fenced_buffer *fenced_buf = fenced_buffer(buf);
745    struct fenced_manager *fenced_mgr = fenced_buf->mgr;
746    enum pipe_error ret;
747 
748    mtx_lock(&fenced_mgr->mutex);
749 
750    if (!vl) {
751       /* Invalidate. */
752       fenced_buf->vl = NULL;
753       fenced_buf->validation_flags = 0;
754       ret = PIPE_OK;
755       goto done;
756    }
757 
758    assert(flags & PB_USAGE_GPU_READ_WRITE);
759    assert(!(flags & ~PB_USAGE_GPU_READ_WRITE));
760    flags &= PB_USAGE_GPU_READ_WRITE;
761 
762    /* Buffer cannot be validated in two different lists. */
763    if (fenced_buf->vl && fenced_buf->vl != vl) {
764       ret = PIPE_ERROR_RETRY;
765       goto done;
766    }
767 
768    if (fenced_buf->vl == vl &&
769       (fenced_buf->validation_flags & flags) == flags) {
770       /* Nothing to do -- buffer already validated. */
771       ret = PIPE_OK;
772       goto done;
773    }
774 
775    /* Create and update GPU storage. */
776    if (!fenced_buf->buffer) {
777       assert(!fenced_buf->mapcount);
778 
779       ret = fenced_buffer_create_gpu_storage_locked(fenced_mgr, fenced_buf, TRUE);
780       if (ret != PIPE_OK) {
781          goto done;
782       }
783 
784       ret = fenced_buffer_copy_storage_to_gpu_locked(fenced_buf);
785       if (ret != PIPE_OK) {
786          fenced_buffer_destroy_gpu_storage_locked(fenced_buf);
787          goto done;
788       }
789 
790       if (fenced_buf->mapcount) {
791          debug_printf("warning: validating a buffer while it is still mapped\n");
792       } else {
793          fenced_buffer_destroy_cpu_storage_locked(fenced_buf);
794       }
795    }
796 
797    ret = pb_validate(fenced_buf->buffer, vl, flags);
798    if (ret != PIPE_OK)
799       goto done;
800 
801    fenced_buf->vl = vl;
802    fenced_buf->validation_flags |= flags;
803 
804  done:
805    mtx_unlock(&fenced_mgr->mutex);
806 
807    return ret;
808 }
809 
810 
811 static void
fenced_buffer_fence(struct pb_buffer * buf,struct pipe_fence_handle * fence)812 fenced_buffer_fence(struct pb_buffer *buf,
813                     struct pipe_fence_handle *fence)
814 {
815    struct fenced_buffer *fenced_buf = fenced_buffer(buf);
816    struct fenced_manager *fenced_mgr = fenced_buf->mgr;
817    struct pb_fence_ops *ops = fenced_mgr->ops;
818 
819    mtx_lock(&fenced_mgr->mutex);
820 
821    assert(pipe_is_referenced(&fenced_buf->base.reference));
822    assert(fenced_buf->buffer);
823 
824    if (fence != fenced_buf->fence) {
825       assert(fenced_buf->vl);
826       assert(fenced_buf->validation_flags);
827 
828       if (fenced_buf->fence) {
829          MAYBE_UNUSED boolean destroyed = fenced_buffer_remove_locked(fenced_mgr, fenced_buf);
830          assert(!destroyed);
831       }
832       if (fence) {
833          ops->fence_reference(ops, &fenced_buf->fence, fence);
834          fenced_buf->flags |= fenced_buf->validation_flags;
835          fenced_buffer_add_locked(fenced_mgr, fenced_buf);
836       }
837 
838       pb_fence(fenced_buf->buffer, fence);
839 
840       fenced_buf->vl = NULL;
841       fenced_buf->validation_flags = 0;
842    }
843 
844    mtx_unlock(&fenced_mgr->mutex);
845 }
846 
847 
848 static void
fenced_buffer_get_base_buffer(struct pb_buffer * buf,struct pb_buffer ** base_buf,pb_size * offset)849 fenced_buffer_get_base_buffer(struct pb_buffer *buf,
850                               struct pb_buffer **base_buf,
851                               pb_size *offset)
852 {
853    struct fenced_buffer *fenced_buf = fenced_buffer(buf);
854    struct fenced_manager *fenced_mgr = fenced_buf->mgr;
855 
856    mtx_lock(&fenced_mgr->mutex);
857 
858    /* This should only be called when the buffer is validated. Typically
859     * when processing relocations.
860     */
861    assert(fenced_buf->vl);
862    assert(fenced_buf->buffer);
863 
864    if (fenced_buf->buffer) {
865       pb_get_base_buffer(fenced_buf->buffer, base_buf, offset);
866    } else {
867       *base_buf = buf;
868       *offset = 0;
869    }
870 
871    mtx_unlock(&fenced_mgr->mutex);
872 }
873 
874 
875 static const struct pb_vtbl
876 fenced_buffer_vtbl = {
877    fenced_buffer_destroy,
878    fenced_buffer_map,
879    fenced_buffer_unmap,
880    fenced_buffer_validate,
881    fenced_buffer_fence,
882    fenced_buffer_get_base_buffer
883 };
884 
885 
886 /**
887  * Wrap a buffer in a fenced buffer.
888  */
889 static struct pb_buffer *
fenced_bufmgr_create_buffer(struct pb_manager * mgr,pb_size size,const struct pb_desc * desc)890 fenced_bufmgr_create_buffer(struct pb_manager *mgr,
891                             pb_size size,
892                             const struct pb_desc *desc)
893 {
894    struct fenced_manager *fenced_mgr = fenced_manager(mgr);
895    struct fenced_buffer *fenced_buf;
896    enum pipe_error ret;
897 
898    /* Don't stall the GPU, waste time evicting buffers, or waste memory
899     * trying to create a buffer that will most likely never fit into the
900     * graphics aperture.
901     */
902    if (size > fenced_mgr->max_buffer_size) {
903       goto no_buffer;
904    }
905 
906    fenced_buf = CALLOC_STRUCT(fenced_buffer);
907    if (!fenced_buf)
908       goto no_buffer;
909 
910    pipe_reference_init(&fenced_buf->base.reference, 1);
911    fenced_buf->base.alignment = desc->alignment;
912    fenced_buf->base.usage = desc->usage;
913    fenced_buf->base.size = size;
914    fenced_buf->size = size;
915    fenced_buf->desc = *desc;
916 
917    fenced_buf->base.vtbl = &fenced_buffer_vtbl;
918    fenced_buf->mgr = fenced_mgr;
919 
920    mtx_lock(&fenced_mgr->mutex);
921 
922    /* Try to create GPU storage without stalling. */
923    ret = fenced_buffer_create_gpu_storage_locked(fenced_mgr, fenced_buf, FALSE);
924 
925    /* Attempt to use CPU memory to avoid stalling the GPU. */
926    if (ret != PIPE_OK) {
927       ret = fenced_buffer_create_cpu_storage_locked(fenced_mgr, fenced_buf);
928    }
929 
930    /* Create GPU storage, waiting for some to be available. */
931    if (ret != PIPE_OK) {
932       ret = fenced_buffer_create_gpu_storage_locked(fenced_mgr, fenced_buf, TRUE);
933    }
934 
935    /* Give up. */
936    if (ret != PIPE_OK) {
937       goto no_storage;
938    }
939 
940    assert(fenced_buf->buffer || fenced_buf->data);
941 
942    LIST_ADDTAIL(&fenced_buf->head, &fenced_mgr->unfenced);
943    ++fenced_mgr->num_unfenced;
944    mtx_unlock(&fenced_mgr->mutex);
945 
946    return &fenced_buf->base;
947 
948  no_storage:
949    mtx_unlock(&fenced_mgr->mutex);
950    FREE(fenced_buf);
951  no_buffer:
952    return NULL;
953 }
954 
955 
956 static void
fenced_bufmgr_flush(struct pb_manager * mgr)957 fenced_bufmgr_flush(struct pb_manager *mgr)
958 {
959    struct fenced_manager *fenced_mgr = fenced_manager(mgr);
960 
961    mtx_lock(&fenced_mgr->mutex);
962    while (fenced_manager_check_signalled_locked(fenced_mgr, TRUE))
963       ;
964    mtx_unlock(&fenced_mgr->mutex);
965 
966    assert(fenced_mgr->provider->flush);
967    if (fenced_mgr->provider->flush)
968       fenced_mgr->provider->flush(fenced_mgr->provider);
969 }
970 
971 
972 static void
fenced_bufmgr_destroy(struct pb_manager * mgr)973 fenced_bufmgr_destroy(struct pb_manager *mgr)
974 {
975    struct fenced_manager *fenced_mgr = fenced_manager(mgr);
976 
977    mtx_lock(&fenced_mgr->mutex);
978 
979    /* Wait on outstanding fences. */
980    while (fenced_mgr->num_fenced) {
981       mtx_unlock(&fenced_mgr->mutex);
982 #if defined(PIPE_OS_LINUX) || defined(PIPE_OS_BSD) || defined(PIPE_OS_SOLARIS)
983       sched_yield();
984 #endif
985       mtx_lock(&fenced_mgr->mutex);
986       while (fenced_manager_check_signalled_locked(fenced_mgr, TRUE))
987          ;
988    }
989 
990 #ifdef DEBUG
991    /* assert(!fenced_mgr->num_unfenced); */
992 #endif
993 
994    mtx_unlock(&fenced_mgr->mutex);
995    mtx_destroy(&fenced_mgr->mutex);
996 
997    if (fenced_mgr->provider)
998       fenced_mgr->provider->destroy(fenced_mgr->provider);
999 
1000    fenced_mgr->ops->destroy(fenced_mgr->ops);
1001 
1002    FREE(fenced_mgr);
1003 }
1004 
1005 
1006 struct pb_manager *
fenced_bufmgr_create(struct pb_manager * provider,struct pb_fence_ops * ops,pb_size max_buffer_size,pb_size max_cpu_total_size)1007 fenced_bufmgr_create(struct pb_manager *provider,
1008                      struct pb_fence_ops *ops,
1009                      pb_size max_buffer_size,
1010                      pb_size max_cpu_total_size)
1011 {
1012    struct fenced_manager *fenced_mgr;
1013 
1014    if (!provider)
1015       return NULL;
1016 
1017    fenced_mgr = CALLOC_STRUCT(fenced_manager);
1018    if (!fenced_mgr)
1019       return NULL;
1020 
1021    fenced_mgr->base.destroy = fenced_bufmgr_destroy;
1022    fenced_mgr->base.create_buffer = fenced_bufmgr_create_buffer;
1023    fenced_mgr->base.flush = fenced_bufmgr_flush;
1024 
1025    fenced_mgr->provider = provider;
1026    fenced_mgr->ops = ops;
1027    fenced_mgr->max_buffer_size = max_buffer_size;
1028    fenced_mgr->max_cpu_total_size = max_cpu_total_size;
1029 
1030    LIST_INITHEAD(&fenced_mgr->fenced);
1031    fenced_mgr->num_fenced = 0;
1032 
1033    LIST_INITHEAD(&fenced_mgr->unfenced);
1034    fenced_mgr->num_unfenced = 0;
1035 
1036    (void) mtx_init(&fenced_mgr->mutex, mtx_plain);
1037 
1038    return &fenced_mgr->base;
1039 }
1040