/**************************************************************************
*
* Copyright 2006-2008 Tungsten Graphics, Inc., Cedar Park, TX., USA
* All Rights Reserved.
* Copyright 2009 VMware, Inc., Palo Alto, CA., USA
* All Rights Reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the
* "Software"), to deal in the Software without restriction, including
* without limitation the rights to use, copy, modify, merge, publish,
* distribute, sub license, and/or sell copies of the Software, and to
* permit persons to whom the Software is furnished to do so, subject to
* the following conditions:
*
* The above copyright notice and this permission notice (including the
* next paragraph) shall be included in all copies or substantial portions
* of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
* THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
* DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
* OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
* USE OR OTHER DEALINGS IN THE SOFTWARE.
*
**************************************************************************/
/*
* Authors: Thomas Hellstrom <thomas-at-tungstengraphics-dot-com>
*/
#ifdef HAVE_CONFIG_H
#include "config.h"
#endif
#include <drm/psb_ttm_placement_user.h>
#include <stdint.h>
#include <sys/time.h>
#include <errno.h>
#include <unistd.h>
#include <assert.h>
#include <string.h>
#include <sys/mman.h>
#include <xf86drm.h>
#include "wsbm_pool.h"
#include "wsbm_fencemgr.h"
#include "wsbm_priv.h"
#include "wsbm_manager.h"
/* Number of attempts wsbmSlabAllocBuffer() makes to obtain a usable slab. */
#define WSBM_SLABPOOL_ALLOC_RETRIES 100

/*
 * Issue a write-only DRM command and reissue it for as long as it returns
 * -EAGAIN or -ERESTART. The final return value is stored in _ret.
 *
 * The expansion deliberately ends without a semicolon or a line
 * continuation: the caller supplies the terminating ';', which keeps the
 * macro usable as a single statement (e.g. in an unbraced if/else) and
 * prevents the following source line from being spliced into the macro.
 */
#define DRMRESTARTCOMMANDWRITE(_fd, _val, _arg, _ret) \
    do { \
        (_ret) = drmCommandWrite(_fd, _val, &(_arg), sizeof(_arg)); \
    } while ((_ret) == -EAGAIN || (_ret) == -ERESTART)

/*
 * Same as DRMRESTARTCOMMANDWRITE, but for commands that also return data
 * in _arg (drmCommandWriteRead).
 */
#define DRMRESTARTCOMMANDWRITEREAD(_fd, _val, _arg, _ret) \
    do { \
        (_ret) = drmCommandWriteRead(_fd, _val, &(_arg), sizeof(_arg)); \
    } while ((_ret) == -EAGAIN || (_ret) == -ERESTART)

/*
 * Debug-only counters, compiled in when DEBUG_FENCESIGNALED is defined.
 * createbuffer is incremented for every buffer handed out by
 * wsbmSlabAllocBuffer(); fencesignaled is incremented for every
 * wsbmFenceSignaled() poll made by wsbmSlabCheckFreeLocked().
 */
#ifdef DEBUG_FENCESIGNALED
static int createbuffer = 0;
static int fencesignaled = 0;
#endif
struct _WsbmSlab;
/*
 * One buffer handed out by the slab pool. It is either a fixed-size piece
 * of a slab (isSlabBuffer != 0) or, for sizes that fit no bucket, a
 * stand-alone kernel buffer object created directly by pool_create().
 */
struct _WsbmSlabBuffer
{
/* Kernel buffer info; used by pool_kernel() only for non-slab buffers. */
struct _WsbmKernelBuf kBuf;
/* Generic storage embedded here; slabBuffer() maps it back to this struct. */
struct _WsbmBufStorage storage;
/* Broadcast when writers drops to zero or the unFenced state is cleared. */
struct _WsbmCond event;
/*
* Remains constant after creation.
*/
/* 1 for buffers carved out of a slab, 0 for the direct-DRM fallback. */
int isSlabBuffer;
/* Owning slab (slab buffers only). */
struct _WsbmSlab *parent;
/* Byte offset of this buffer inside the slab's kernel BO. */
uint32_t start;
/* CPU address of the buffer's mapping. */
void *virtual;
/* Size passed to pool_create(); set only for non-slab buffers. */
unsigned long requestedSize;
/* mmap offset handle returned by the kernel; set only for non-slab buffers. */
uint64_t mapHandle;
/*
* Protected by struct _WsbmSlabSizeHeader::mutex
*/
/* Link in the slab's freeBuffers list or the header's delayedBuffers list. */
struct _WsbmListHead head;
/*
* Protected by this::mutex
*/
/* Fence that must signal before the buffer is idle, or NULL. */
struct _WsbmFenceObject *fence;
/* Fence type mask used when querying or waiting on fence. */
uint32_t fenceType;
/* Incremented by pool_syncForCpu(), decremented by pool_releaseFromCpu(). */
struct _WsbmAtomic writers; /* (Only upping) */
/* Set by pool_validate(); cleared by pool_fence() / pool_unvalidate(). */
int unFenced;
};
struct _WsbmSlabPool;
/*
 * A kernel buffer object that backs one slab. When its slab is released it
 * is parked in the _WsbmSlabCache for possible reuse until it times out.
 */
struct _WsbmSlabKernelBO
{
/*
* Constant at creation
*/
/* Handle, GPU offset and placement as reported by the kernel. */
struct _WsbmKernelBuf kBuf;
/* Page alignment; compared with the pool's requirement on cache reuse. */
uint32_t pageAlignment;
/* CPU mapping of the whole buffer object. */
void *virtual;
/* Buffer object size as reported by the kernel (also the mapping length). */
unsigned long actualSize;
/* mmap offset handle returned by the kernel. */
uint64_t mapHandle;
/*
* Protected by struct _WsbmSlabCache::mutex
*/
/* Pool that created this BO; supplies fd and devOffset when it is freed. */
struct _WsbmSlabPool *slabPool;
/* Placement flags most recently requested for this BO. */
uint32_t proposedPlacement;
/* Link in _WsbmSlabCache::timeoutList. */
struct _WsbmListHead timeoutHead;
/* Link in _WsbmSlabCache::cached or ::unCached. */
struct _WsbmListHead head;
/* Point in time after which the cached BO may be destroyed. */
struct timeval timeFreed;
};
/*
 * A slab: one kernel buffer object divided into numBuffers equally sized
 * buffers of the owning header's bufSize.
 */
struct _WsbmSlab
{
/* Link in the header's slabs or freeSlabs list (self-linked when on neither). */
struct _WsbmListHead head;
/* Buffers of this slab that are currently available. */
struct _WsbmListHead freeBuffers;
/* Total number of buffers in this slab. */
uint32_t numBuffers;
/* Number of buffers currently free. */
uint32_t numFree;
/* Array of numBuffers buffer descriptors. */
struct _WsbmSlabBuffer *buffers;
/* Size bucket this slab belongs to. */
struct _WsbmSlabSizeHeader *header;
/* Backing kernel buffer object. */
struct _WsbmSlabKernelBO *kbo;
};
/*
 * Per-bucket bookkeeping: all slabs whose buffers have size bufSize.
 */
struct _WsbmSlabSizeHeader
{
/*
* Constant at creation.
*/
/* Pool this bucket belongs to. */
struct _WsbmSlabPool *slabPool;
/* Size in bytes of every buffer in this bucket. */
uint32_t bufSize;
/*
* Protected by this::mutex
*/
/* Slabs that have at least one, but not all, buffers free. */
struct _WsbmListHead slabs;
/* Slabs whose buffers are all free. */
struct _WsbmListHead freeSlabs;
/* Destroyed buffers still waiting for their fence to signal. */
struct _WsbmListHead delayedBuffers;
/* Number of entries on delayedBuffers. */
uint32_t numDelayed;
struct _WsbmMutex mutex;
};
/*
 * Cache of released slab kernel buffer objects, kept for reuse until they
 * time out. Created by wsbmSlabCacheInit().
 */
struct _WsbmSlabCache
{
/* How long a released kernel BO stays in the cache. */
struct timeval slabTimeout;
/* Minimum interval between two scans for timed-out kernel BOs. */
struct timeval checkInterval;
/* Earliest time at which the next scan is performed. */
struct timeval nextCheck;
/* All cached kernel BOs, appended at the tail as they are released. */
struct _WsbmListHead timeoutList;
/* Cached kernel BOs whose placement lacks TTM_PL_FLAG_CACHED. */
struct _WsbmListHead unCached;
/* Cached kernel BOs whose placement has TTM_PL_FLAG_CACHED. */
struct _WsbmListHead cached;
/* Protects the lists above and nextCheck. */
struct _WsbmMutex mutex;
};
/*
 * The slab buffer pool: a generic _WsbmBufferPool plus one size header per
 * bucket. Set up by wsbmSlabPoolInit().
 */
struct _WsbmSlabPool
{
/* Generic pool embedded here; slabPoolFromPool() maps it back. */
struct _WsbmBufferPool pool;
/*
* The data of this structure remains constant after
* initialization and thus needs no mutex protection.
*/
/* Added to the TTM_PL_* command numbers to form the DRM command index. */
unsigned int devOffset;
/* Cache that released slab kernel BOs are returned to. */
struct _WsbmSlabCache *cache;
/* Placement flags requested for slab kernel BOs. */
uint32_t proposedPlacement;
/* Stored by wsbmSlabPoolInit(); not read elsewhere in this file. */
uint32_t validMask;
/* Buffer size of each bucket: smallestSize << bucket index. */
uint32_t *bucketSizes;
/* Number of entries in bucketSizes and headers. */
uint32_t numBuckets;
/* System page size from getpagesize(). */
uint32_t pageSize;
/* Page alignment requested for slab kernel BOs. */
int pageAlignment;
/* Upper bound on the size of a slab. */
int maxSlabSize;
/* Preferred number of buffers per slab. */
int desiredNumBuffers;
/* Array of numBuckets size headers. */
struct _WsbmSlabSizeHeader *headers;
};
/*
 * Map a generic buffer pool back to the slab pool that embeds it.
 */
static inline struct _WsbmSlabPool *
slabPoolFromPool(struct _WsbmBufferPool *pool)
{
    struct _WsbmSlabPool *owner =
        containerOf(pool, struct _WsbmSlabPool, pool);

    return owner;
}
/*
 * Return the slab pool a buffer was allocated from, via the pool pointer
 * stored in the buffer's generic storage.
 */
static inline struct _WsbmSlabPool *
slabPoolFromBuf(struct _WsbmSlabBuffer *sBuf)
{
    struct _WsbmBufferPool *genericPool = sBuf->storage.pool;

    return slabPoolFromPool(genericPool);
}
/*
 * Map a generic buffer storage back to the slab buffer that embeds it.
 */
static inline struct _WsbmSlabBuffer *
slabBuffer(struct _WsbmBufStorage *buf)
{
    struct _WsbmSlabBuffer *container =
        containerOf(buf, struct _WsbmSlabBuffer, storage);

    return container;
}
/*
* FIXME: Perhaps arrange timeout slabs in size buckets for fast
* retrieval?
*/
/*
 * Return nonzero if *arg1 is later than or equal to *arg2, zero otherwise.
 *
 * Seconds are compared first; microseconds decide only when the seconds
 * are equal. Identical timestamps compare as "after or equal", as the
 * function name promises.
 */
static inline int
wsbmTimeAfterEq(const struct timeval *arg1, const struct timeval *arg2)
{
    if (arg1->tv_sec != arg2->tv_sec)
        return arg1->tv_sec > arg2->tv_sec;

    return arg1->tv_usec >= arg2->tv_usec;
}
/*
 * Add *add to *arg in place, carrying whole seconds out of the
 * microsecond field into the seconds field.
 */
static inline void
wsbmTimeAdd(struct timeval *arg, struct timeval *add)
{
    unsigned int carry;

    arg->tv_usec += add->tv_usec;
    arg->tv_sec += add->tv_sec;

    /* Whole seconds accumulated in the microsecond field. */
    carry = arg->tv_usec / 1000000;
    arg->tv_usec -= carry * 1000000;
    arg->tv_sec += carry;
}
static void
wsbmFreeKernelBO(struct _WsbmSlabKernelBO *kbo)
{
struct ttm_pl_reference_req arg;
struct _WsbmSlabPool *slabPool;
if (!kbo)
return;
slabPool = kbo->slabPool;
arg.handle = kbo->kBuf.handle;
(void)munmap(kbo->virtual, kbo->actualSize);
(void)drmCommandWrite(slabPool->pool.fd,
slabPool->devOffset + TTM_PL_UNREF, &arg,
sizeof(arg));
free(kbo);
}
/*
 * Destroy cached kernel buffer objects whose timeout has passed.
 *
 * Nothing happens unless *time has reached cache->nextCheck. Otherwise the
 * timeout list is walked from its head, stopping at the first entry that
 * has not yet expired, and nextCheck is advanced to *time + checkInterval.
 * The caller holds cache->mutex.
 */
static void
wsbmFreeTimeoutKBOsLocked(struct _WsbmSlabCache *cache, struct timeval *time)
{
    struct _WsbmListHead *cur, *nxt;

    if (wsbmTimeAfterEq(time, &cache->nextCheck)) {
        WSBMLISTFOREACHSAFE(cur, nxt, &cache->timeoutList) {
            struct _WsbmSlabKernelBO *expired =
                WSBMLISTENTRY(cur, struct _WsbmSlabKernelBO, timeoutHead);

            if (!wsbmTimeAfterEq(time, &expired->timeFreed))
                break;

            WSBMLISTDELINIT(&expired->timeoutHead);
            WSBMLISTDELINIT(&expired->head);
            wsbmFreeKernelBO(expired);
        }

        cache->nextCheck = *time;
        wsbmTimeAdd(&cache->nextCheck, &cache->checkInterval);
    }
}
/*
 * Hand a _WsbmSlabKernelBO over to the slab cache.
 * It becomes available for reuse; if nobody reuses it before
 * cache->slabTimeout has elapsed it is destroyed by a later scan.
 * Releasing a BO also triggers a scan for already expired entries.
 */
static void
wsbmSetKernelBOFree(struct _WsbmSlabCache *cache,
                    struct _WsbmSlabKernelBO *kbo)
{
    struct timeval now;
    struct timeval expiry;
    struct _WsbmListHead *bucket;

    gettimeofday(&now, NULL);
    expiry = now;

    WSBM_MUTEX_LOCK(&cache->mutex);

    wsbmTimeAdd(&expiry, &cache->slabTimeout);
    kbo->timeFreed = expiry;

    /* File the BO under the list matching its actual placement. */
    bucket = (kbo->kBuf.placement & TTM_PL_FLAG_CACHED) ?
        &cache->cached : &cache->unCached;
    WSBMLISTADD(&kbo->head, bucket);
    WSBMLISTADDTAIL(&kbo->timeoutHead, &cache->timeoutList);

    wsbmFreeTimeoutKBOsLocked(cache, &now);

    WSBM_MUTEX_UNLOCK(&cache->mutex);
}
/*
* Get a _SlabKernelBO for us to use as storage for a slab.
*/
static struct _WsbmSlabKernelBO *
wsbmAllocKernelBO(struct _WsbmSlabSizeHeader *header)
{
struct _WsbmSlabPool *slabPool = header->slabPool;
struct _WsbmSlabCache *cache = slabPool->cache;
struct _WsbmListHead *list, *head;
uint32_t size = header->bufSize * slabPool->desiredNumBuffers;
struct _WsbmSlabKernelBO *kbo;
struct _WsbmSlabKernelBO *kboTmp;
int ret;
/*
* FIXME: We should perhaps allow some variation in slabsize in order
* to efficiently reuse slabs.
*/
size = (size <= (uint32_t) slabPool->maxSlabSize) ? size : (uint32_t) slabPool->maxSlabSize;
if (size < header->bufSize)
size = header->bufSize;
size = (size + slabPool->pageSize - 1) & ~(slabPool->pageSize - 1);
WSBM_MUTEX_LOCK(&cache->mutex);
kbo = NULL;
retry:
head = (slabPool->proposedPlacement & TTM_PL_FLAG_CACHED) ?
&cache->cached : &cache->unCached;
WSBMLISTFOREACH(list, head) {
kboTmp = WSBMLISTENTRY(list, struct _WsbmSlabKernelBO, head);
if ((kboTmp->actualSize == size) &&
(slabPool->pageAlignment == 0 ||
(kboTmp->pageAlignment % slabPool->pageAlignment) == 0)) {
if (!kbo)
kbo = kboTmp;
if ((kbo->proposedPlacement ^ slabPool->proposedPlacement) == 0)
break;
}
}
if (kbo) {
WSBMLISTDELINIT(&kbo->head);
WSBMLISTDELINIT(&kbo->timeoutHead);
}
WSBM_MUTEX_UNLOCK(&cache->mutex);
if (kbo) {
uint32_t new_mask =
kbo->proposedPlacement ^ slabPool->proposedPlacement;
ret = 0;
if (new_mask) {
union ttm_pl_setstatus_arg arg;
struct ttm_pl_setstatus_req *req = &arg.req;
struct ttm_pl_rep *rep = &arg.rep;
req->handle = kbo->kBuf.handle;
req->set_placement = slabPool->proposedPlacement & new_mask;
req->clr_placement = ~slabPool->proposedPlacement & new_mask;
DRMRESTARTCOMMANDWRITEREAD(slabPool->pool.fd,
slabPool->devOffset + TTM_PL_SETSTATUS,
arg, ret);
if (ret == 0) {
kbo->kBuf.gpuOffset = rep->gpu_offset;
kbo->kBuf.placement = rep->placement;
}
kbo->proposedPlacement = slabPool->proposedPlacement;
}
if (ret == 0)
return kbo;
wsbmFreeKernelBO(kbo);
kbo = NULL;
goto retry;
}
kbo = calloc(1, sizeof(*kbo));
if (!kbo)
return NULL;
{
union ttm_pl_create_arg arg;
kbo->slabPool = slabPool;
WSBMINITLISTHEAD(&kbo->head);
WSBMINITLISTHEAD(&kbo->timeoutHead);
arg.req.size = size;
arg.req.placement = slabPool->proposedPlacement;
arg.req.page_alignment = slabPool->pageAlignment;
DRMRESTARTCOMMANDWRITEREAD(slabPool->pool.fd,
slabPool->devOffset + TTM_PL_CREATE,
arg, ret);
if (ret)
goto out_err0;
kbo->kBuf.gpuOffset = arg.rep.gpu_offset;
kbo->kBuf.placement = arg.rep.placement;
kbo->kBuf.handle = arg.rep.handle;
kbo->actualSize = arg.rep.bo_size;
kbo->mapHandle = arg.rep.map_handle;
kbo->proposedPlacement = slabPool->proposedPlacement;
}
kbo->virtual = mmap(0, kbo->actualSize,
PROT_READ | PROT_WRITE, MAP_SHARED,
slabPool->pool.fd, kbo->mapHandle);
if (kbo->virtual == MAP_FAILED) {
ret = -errno;
goto out_err1;
}
return kbo;
out_err1:
{
struct ttm_pl_reference_req arg = {.handle = kbo->kBuf.handle };
(void)drmCommandWrite(slabPool->pool.fd,
slabPool->devOffset + TTM_PL_UNREF,
&arg, sizeof(arg));
}
out_err0:
free(kbo);
return NULL;
}
/*
 * Allocate a new slab for the given size bucket and put it on
 * header->slabs with all of its buffers free.
 *
 * The slab's kernel BO is divided into actualSize / bufSize buffers, each
 * with its own storage and condition variable. The caller holds
 * header->mutex.
 *
 * Returns 0 on success or a negative errno value. On failure every buffer
 * that was already initialised is torn down again and the kernel BO is
 * handed back to the slab cache.
 */
static int
wsbmAllocSlab(struct _WsbmSlabSizeHeader *header)
{
    struct _WsbmSlab *slab;
    struct _WsbmSlabBuffer *sBuf;
    uint32_t numBuffers;
    int ret;                    /* negative errno, hence signed */
    uint32_t i;

    slab = calloc(1, sizeof(*slab));
    if (!slab)
        return -ENOMEM;

    slab->kbo = wsbmAllocKernelBO(header);
    if (!slab->kbo) {
        ret = -ENOMEM;
        goto out_err0;
    }

    numBuffers = slab->kbo->actualSize / header->bufSize;
    if (numBuffers == 0) {
        /* A slab without buffers could never satisfy an allocation. */
        ret = -ENOMEM;
        goto out_err1;
    }

    slab->buffers = calloc(numBuffers, sizeof(*slab->buffers));
    if (!slab->buffers) {
        ret = -ENOMEM;
        goto out_err1;
    }

    WSBMINITLISTHEAD(&slab->head);
    WSBMINITLISTHEAD(&slab->freeBuffers);
    slab->numBuffers = numBuffers;
    slab->numFree = 0;
    slab->header = header;

    sBuf = slab->buffers;
    for (i = 0; i < numBuffers; ++i) {
        ret = wsbmBufStorageInit(&sBuf->storage, &header->slabPool->pool);
        if (ret)
            goto out_err2;
        sBuf->parent = slab;
        sBuf->start = i * header->bufSize;
        sBuf->virtual = (void *)((uint8_t *) slab->kbo->virtual +
                                 sBuf->start);
        wsbmAtomicSet(&sBuf->writers, 0);
        sBuf->isSlabBuffer = 1;
        WSBM_COND_INIT(&sBuf->event);
        WSBMLISTADDTAIL(&sBuf->head, &slab->freeBuffers);
        slab->numFree++;
        sBuf++;
    }

    WSBMLISTADDTAIL(&slab->head, &header->slabs);
    return 0;

out_err2:
    /*
     * The array was zero-allocated, so only buffers that were fully set up
     * have parent == slab.
     */
    sBuf = slab->buffers;
    for (i = 0; i < numBuffers; ++i) {
        if (sBuf->parent == slab) {
            WSBM_COND_FREE(&sBuf->event);
            wsbmBufStorageTakedown(&sBuf->storage);
        }
        sBuf++;
    }
    free(slab->buffers);
out_err1:
    wsbmSetKernelBOFree(header->slabPool->cache, slab->kbo);
out_err0:
    free(slab);
    return ret;
}
/*
* Unlink a buffer from whatever list it is on (for example the slab
* header's delayed list) and put it on its slab's free list.
*
* Afterwards the slab is moved to the matching header list, and slabs
* that are entirely free may be released to the slab cache.
* The caller holds the header mutex.
*/
static void
wsbmSlabFreeBufferLocked(struct _WsbmSlabBuffer *buf)
{
struct _WsbmSlab *slab = buf->parent;
struct _WsbmSlabSizeHeader *header = slab->header;
struct _WsbmListHead *list = &buf->head;
WSBMLISTDEL(list);
WSBMLISTADDTAIL(list, &slab->freeBuffers);
slab->numFree++;
/*
* A self-linked head means the slab is on no list (wsbmSlabAllocBuffer()
* unlinks a slab when its last free buffer is taken); it has a free
* buffer again, so make it visible to allocations.
*/
if (slab->head.next == &slab->head)
WSBMLISTADDTAIL(&slab->head, &header->slabs);
/* Every buffer is free: move the slab to the list of free slabs. */
if (slab->numFree == slab->numBuffers) {
list = &slab->head;
WSBMLISTDEL(list);
WSBMLISTADDTAIL(list, &header->freeSlabs);
}
/*
* Release all free slabs when no partially used slab is left, or when
* this slab still has buffers in use.
*/
if (header->slabs.next == &header->slabs ||
slab->numFree != slab->numBuffers) {
struct _WsbmListHead *next;
struct _WsbmSlabCache *cache = header->slabPool->cache;
WSBMLISTFOREACHSAFE(list, next, &header->freeSlabs) {
uint32_t i;
struct _WsbmSlabBuffer *sBuf;
slab = WSBMLISTENTRY(list, struct _WsbmSlab, head);
WSBMLISTDELINIT(list);
/* Tear down the per-buffer state of every buffer in the slab. */
sBuf = slab->buffers;
for (i = 0; i < slab->numBuffers; ++i) {
if (sBuf->parent == slab) {
WSBM_COND_FREE(&sBuf->event);
wsbmBufStorageTakedown(&sBuf->storage);
}
sBuf++;
}
/* The kernel BO goes back to the cache for possible reuse. */
wsbmSetKernelBOFree(cache, slab->kbo);
free(slab->buffers);
free(slab);
}
}
}
/*
 * Move delayed buffers whose fence has signaled back to their slab's free
 * list. The caller holds header->mutex.
 *
 * @header: size bucket whose delayedBuffers list is examined.
 * @wait:   if nonzero, block (wsbmFenceFinish) on the first buffer examined
 *          instead of only polling it; the flag is cleared once that wait
 *          has succeeded.
 */
static void
wsbmSlabCheckFreeLocked(struct _WsbmSlabSizeHeader *header, int wait)
{
struct _WsbmListHead *list, *prev, *first, *head;
struct _WsbmSlabBuffer *sBuf;
struct _WsbmSlab *slab;
int firstWasSignaled = 1;
int signaled;
uint32_t i;
int ret;
/*
* Rerun the freeing test if the youngest tested buffer
* was signaled, since there might be more idle buffers
* in the delay list.
*/
while (firstWasSignaled) {
firstWasSignaled = 0;
signaled = 0;
first = header->delayedBuffers.next;
/* Only examine the oldest 1/3 of delayed buffers:
*/
/* Advance first by one entry for every three delayed buffers. */
if (header->numDelayed > 3) {
for (i = 0; i < header->numDelayed; i += 3) {
first = first->next;
}
}
/*
* No need to take the buffer mutex for each buffer we loop
* through since we're currently the only user.
*/
/*
* NOTE(review): WSBMLISTFOREACHPREVSAFE is defined elsewhere; presumably
* it walks backwards starting at head->prev, i.e. at first - confirm.
*/
head = first->next;
WSBMLISTFOREACHPREVSAFE(list, prev, head) {
/* Reached the list head itself: no more buffers to look at. */
if (list == &header->delayedBuffers)
break;
sBuf = WSBMLISTENTRY(list, struct _WsbmSlabBuffer, head);
slab = sBuf->parent;
if (!signaled) {
/*
* Until one fence is known to have signaled, query (or wait on) the
* fence itself.
*/
if (wait) {
ret = wsbmFenceFinish(sBuf->fence, sBuf->fenceType, 0);
if (ret)
break;
signaled = 1;
wait = 0;
} else {
signaled =
wsbmFenceSignaled(sBuf->fence, sBuf->fenceType);
#ifdef DEBUG_FENCESIGNALED
fencesignaled++;
#endif
}
if (signaled) {
if (list == first)
firstWasSignaled = 1;
wsbmFenceUnreference(&sBuf->fence);
header->numDelayed--;
wsbmSlabFreeBufferLocked(sBuf);
} else
break;
/* After the first signaled fence only the cached fence state is checked. */
} else if (wsbmFenceSignaledCached(sBuf->fence, sBuf->fenceType)) {
wsbmFenceUnreference(&sBuf->fence);
header->numDelayed--;
wsbmSlabFreeBufferLocked(sBuf);
}
}
}
}
/*
 * Take one free buffer out of the given size bucket.
 *
 * While no slab with a free buffer exists, delayed buffers are polled for
 * completion and, failing that, a new slab is allocated. This is retried
 * up to WSBM_SLABPOOL_ALLOC_RETRIES times, sleeping 1 ms with the header
 * mutex dropped before every attempt but the first.
 *
 * Returns the buffer, or NULL if no buffer could be obtained.
 */
static struct _WsbmSlabBuffer *
wsbmSlabAllocBuffer(struct _WsbmSlabSizeHeader *header)
{
    /*
     * Plain automatic variable: it is written after the header mutex has
     * been released, so it must not be shared between threads.
     */
    struct _WsbmSlabBuffer *buf;
    struct _WsbmSlab *slab;
    struct _WsbmListHead *list;
    int count = WSBM_SLABPOOL_ALLOC_RETRIES;

    WSBM_MUTEX_LOCK(&header->mutex);
    while (header->slabs.next == &header->slabs && count > 0) {
        /* First try to reclaim buffers whose fences have signaled. */
        wsbmSlabCheckFreeLocked(header, 0);
        if (header->slabs.next != &header->slabs)
            break;

        WSBM_MUTEX_UNLOCK(&header->mutex);
        if (count != WSBM_SLABPOOL_ALLOC_RETRIES)
            usleep(1000);
        WSBM_MUTEX_LOCK(&header->mutex);

        /* Failure is detected by the list still being empty. */
        (void)wsbmAllocSlab(header);
        count--;
    }

    list = header->slabs.next;
    if (list == &header->slabs) {
        WSBM_MUTEX_UNLOCK(&header->mutex);
        return NULL;
    }

    slab = WSBMLISTENTRY(list, struct _WsbmSlab, head);
    /* A slab without free buffers is taken off the allocation list. */
    if (--slab->numFree == 0)
        WSBMLISTDELINIT(list);

    list = slab->freeBuffers.next;
    WSBMLISTDELINIT(list);
    WSBM_MUTEX_UNLOCK(&header->mutex);

    buf = WSBMLISTENTRY(list, struct _WsbmSlabBuffer, head);
    buf->storage.destroyContainer = NULL;
#ifdef DEBUG_FENCESIGNALED
    createbuffer++;
#endif
    return buf;
}
/*
 * Pool "create" hook: allocate storage of at least size bytes.
 *
 * The request is served from the first bucket whose buffer size is large
 * enough. If no bucket fits, a stand-alone buffer object is created
 * directly through TTM_PL_CREATE and mapped; only this fallback path uses
 * placement and alignment.
 *
 * @pool:      the slab pool's generic pool structure.
 * @size:      requested size in bytes.
 * @placement: placement flags for the fallback buffer object.
 * @alignment: requested alignment in bytes for the fallback buffer object;
 *             0, or a value that divides or is a multiple of the page size.
 *
 * Returns the new storage, or NULL on failure.
 */
static struct _WsbmBufStorage *
pool_create(struct _WsbmBufferPool *pool, unsigned long size,
            uint32_t placement, unsigned alignment)
{
    struct _WsbmSlabPool *slabPool = slabPoolFromPool(pool);
    struct _WsbmSlabSizeHeader *header;
    struct _WsbmSlabBuffer *sBuf;
    uint32_t i;
    int ret;

    /*
     * FIXME: Check for compatibility.
     */
    header = slabPool->headers;
    for (i = 0; i < slabPool->numBuckets; ++i) {
        if (header->bufSize >= size)
            break;
        header++;
    }

    if (i < slabPool->numBuckets) {
        sBuf = wsbmSlabAllocBuffer(header);
        return ((sBuf) ? &sBuf->storage : NULL);
    }

    /*
     * Fall back to allocate a buffer object directly from DRM.
     * and wrap it in a wsbmBO structure.
     */
    sBuf = calloc(1, sizeof(*sBuf));
    if (!sBuf)
        return NULL;

    if (alignment) {
        if ((alignment < slabPool->pageSize)
            && (slabPool->pageSize % alignment))
            goto out_err0;
        if ((alignment > slabPool->pageSize)
            && (alignment % slabPool->pageSize))
            goto out_err0;
    }

    ret = wsbmBufStorageInit(&sBuf->storage, pool);
    if (ret)
        goto out_err0;

    ret = WSBM_COND_INIT(&sBuf->event);
    if (ret)
        goto out_err1;

    {
        union ttm_pl_create_arg arg;

        arg.req.size = size;
        arg.req.placement = placement;
        arg.req.page_alignment = alignment / slabPool->pageSize;

        DRMRESTARTCOMMANDWRITEREAD(pool->fd,
                                   slabPool->devOffset + TTM_PL_CREATE,
                                   arg, ret);
        if (ret)
            goto out_err2;

        sBuf->kBuf.gpuOffset = arg.rep.gpu_offset;
        sBuf->kBuf.placement = arg.rep.placement;
        sBuf->kBuf.handle = arg.rep.handle;
        sBuf->mapHandle = arg.rep.map_handle;
        sBuf->requestedSize = size;

        sBuf->virtual = mmap(0, size, PROT_READ | PROT_WRITE, MAP_SHARED,
                             pool->fd, sBuf->mapHandle);
        if (sBuf->virtual == MAP_FAILED)
            goto out_err3;
    }

    wsbmAtomicSet(&sBuf->writers, 0);
    return &sBuf->storage;

out_err3:
    {
        struct ttm_pl_reference_req arg;

        arg.handle = sBuf->kBuf.handle;
        /*
         * TTM_PL_UNREF is issued as a write-only command everywhere else
         * in this file; do the same here so the reference is really
         * dropped.
         */
        (void)drmCommandWrite(pool->fd,
                              slabPool->devOffset + TTM_PL_UNREF,
                              &arg, sizeof(arg));
    }
out_err2:
    WSBM_COND_FREE(&sBuf->event);
out_err1:
    wsbmBufStorageTakedown(&sBuf->storage);
out_err0:
    free(sBuf);
    return NULL;
}
static void
pool_destroy(struct _WsbmBufStorage **p_buf)
{
struct _WsbmBufStorage *buf = *p_buf;
struct _WsbmSlabBuffer *sBuf = slabBuffer(buf);
struct _WsbmSlab *slab;
struct _WsbmSlabSizeHeader *header;
*p_buf = NULL;
if (!sBuf->isSlabBuffer) {
struct _WsbmSlabPool *slabPool = slabPoolFromBuf(sBuf);
struct ttm_pl_reference_req arg;
if (sBuf->virtual != NULL) {
(void)munmap(sBuf->virtual, sBuf->requestedSize);
sBuf->virtual = NULL;
}
arg.handle = sBuf->kBuf.handle;
(void)drmCommandWrite(slabPool->pool.fd,
slabPool->devOffset + TTM_PL_UNREF,
&arg, sizeof(arg));
WSBM_COND_FREE(&sBuf->event);
wsbmBufStorageTakedown(&sBuf->storage);
free(sBuf);
return;
}
slab = sBuf->parent;
header = slab->header;
/*
* No need to take the buffer mutex below since we're the only user.
*/
WSBM_MUTEX_LOCK(&header->mutex);
sBuf->unFenced = 0;
wsbmAtomicSet(&sBuf->writers, 0);
wsbmAtomicSet(&sBuf->storage.refCount, 1);
if (sBuf->fence && !wsbmFenceSignaledCached(sBuf->fence, sBuf->fenceType)) {
WSBMLISTADDTAIL(&sBuf->head, &header->delayedBuffers);
header->numDelayed++;
} else {
if (sBuf->fence)
wsbmFenceUnreference(&sBuf->fence);
wsbmSlabFreeBufferLocked(sBuf);
}
WSBM_MUTEX_UNLOCK(&header->mutex);
}
/*
 * Block until the buffer is neither marked unFenced nor has a fence
 * attached. Called with the buffer's storage mutex held; the mutex is
 * dropped while waiting for a fence to finish and re-taken afterwards,
 * which is why the loop re-evaluates both conditions.
 *
 * @sBuf: buffer to wait for.
 * @lazy: passed through to wsbmFenceFinish().
 */
static void
waitIdleLocked(struct _WsbmSlabBuffer *sBuf, int lazy)
{
struct _WsbmBufStorage *storage = &sBuf->storage;
while (sBuf->unFenced || sBuf->fence != NULL) {
/* Validated but not fenced yet: wait for a broadcast on the buffer event. */
if (sBuf->unFenced)
WSBM_COND_WAIT(&sBuf->event, &storage->mutex);
if (sBuf->fence != NULL) {
if (!wsbmFenceSignaled(sBuf->fence, sBuf->fenceType)) {
/*
* Hold our own reference so the fence stays valid while the mutex is
* released for the blocking wait.
*/
struct _WsbmFenceObject *fence =
wsbmFenceReference(sBuf->fence);
WSBM_MUTEX_UNLOCK(&storage->mutex);
(void)wsbmFenceFinish(fence, sBuf->fenceType, lazy);
WSBM_MUTEX_LOCK(&storage->mutex);
/* Drop the buffer's fence only if it was not replaced while unlocked. */
if (sBuf->fence == fence)
wsbmFenceUnreference(&sBuf->fence);
wsbmFenceUnreference(&fence);
} else {
/* Already signaled: the buffer no longer needs the fence. */
wsbmFenceUnreference(&sBuf->fence);
}
}
}
}
/*
 * Pool "waitIdle" hook: block until the buffer is idle. Always returns 0.
 */
static int
pool_waitIdle(struct _WsbmBufStorage *buf, int lazy)
{
    WSBM_MUTEX_LOCK(&buf->mutex);
    waitIdleLocked(slabBuffer(buf), lazy);
    WSBM_MUTEX_UNLOCK(&buf->mutex);

    return 0;
}
static int
pool_map(struct _WsbmBufStorage *buf, unsigned mode __attribute__ ((unused)), void **virtual)
{
struct _WsbmSlabBuffer *sBuf = slabBuffer(buf);
*virtual = sBuf->virtual;
return 0;
}
/*
 * Pool "releasefromcpu" hook: drop one CPU writer and, when the writer
 * count reaches zero, wake everybody waiting on the buffer event.
 */
static void
pool_releaseFromCpu(struct _WsbmBufStorage *buf, unsigned mode __attribute__ ((unused)))
{
    struct _WsbmSlabBuffer *sBuf = slabBuffer(buf);

    if (!wsbmAtomicDecZero(&sBuf->writers))
        return;

    WSBM_COND_BROADCAST(&sBuf->event);
}
/*
 * Pool "syncforcpu" hook: make the buffer safe for CPU access and register
 * the caller as a writer.
 *
 * Without WSBM_SYNCCPU_DONT_BLOCK the call waits until the buffer is idle.
 * With it, the call fails with -EBUSY if the buffer is unFenced or has a
 * fence that has not signaled. Slab buffers only consult the cached fence
 * state; stand-alone buffers query the fence.
 *
 * Returns 0 on success, -EBUSY if the buffer is busy in non-blocking mode.
 */
static int
pool_syncForCpu(struct _WsbmBufStorage *buf, unsigned mode)
{
    struct _WsbmSlabBuffer *sBuf = slabBuffer(buf);
    int ret = 0;

    WSBM_MUTEX_LOCK(&buf->mutex);

    if (!(mode & WSBM_SYNCCPU_DONT_BLOCK)) {
        waitIdleLocked(sBuf, 0);
        wsbmAtomicInc(&sBuf->writers);
        goto out_unlock;
    }

    if (sBuf->unFenced) {
        ret = -EBUSY;
        goto out_unlock;
    }

    /*
     * Only touch the fence when there is one, like the other
     * possibly-NULL unreference sites in this file.
     */
    if (sBuf->fence != NULL) {
        int signaled = sBuf->isSlabBuffer ?
            wsbmFenceSignaledCached(sBuf->fence, sBuf->fenceType) :
            wsbmFenceSignaled(sBuf->fence, sBuf->fenceType);

        if (!signaled) {
            ret = -EBUSY;
            goto out_unlock;
        }
        wsbmFenceUnreference(&sBuf->fence);
    }

    wsbmAtomicInc(&sBuf->writers);

out_unlock:
    WSBM_MUTEX_UNLOCK(&buf->mutex);
    return ret;
}
/*
 * Pool "unmap" hook: intentionally does nothing.
 */
static void
pool_unmap(struct _WsbmBufStorage *buf __attribute__ ((unused)))
{
    /* Nothing to do. */
}
static unsigned long
pool_poolOffset(struct _WsbmBufStorage *buf)
{
struct _WsbmSlabBuffer *sBuf = slabBuffer(buf);
return sBuf->start;
}
/*
 * Pool "size" hook: a slab buffer reports its bucket's buffer size, a
 * stand-alone buffer the size it was requested with.
 */
static unsigned long
pool_size(struct _WsbmBufStorage *buf)
{
    struct _WsbmSlabBuffer *sBuf = slabBuffer(buf);

    if (sBuf->isSlabBuffer)
        return sBuf->parent->header->bufSize;

    return sBuf->requestedSize;
}
/*
 * Pool "kernel" hook: return the kernel buffer backing this storage. Slab
 * buffers share their slab's kernel BO; stand-alone buffers have their own.
 */
static struct _WsbmKernelBuf *
pool_kernel(struct _WsbmBufStorage *buf)
{
    struct _WsbmSlabBuffer *sBuf = slabBuffer(buf);

    if (sBuf->isSlabBuffer)
        return &sBuf->parent->kbo->kBuf;

    return &sBuf->kBuf;
}
static unsigned long
pool_offset(struct _WsbmBufStorage *buf)
{
return pool_kernel(buf)->gpuOffset + pool_poolOffset(buf);
}
static void
pool_fence(struct _WsbmBufStorage *buf, struct _WsbmFenceObject *fence)
{
struct _WsbmSlabBuffer *sBuf = slabBuffer(buf);
struct _WsbmKernelBuf *kBuf;
WSBM_MUTEX_LOCK(&buf->mutex);
if (sBuf->fence)
wsbmFenceUnreference(&sBuf->fence);
kBuf = pool_kernel(buf);
sBuf->fenceType = kBuf->fence_type_mask;
if (!wsbmFenceSignaledCached(fence, sBuf->fenceType))
sBuf->fence = wsbmFenceReference(fence);
sBuf->unFenced = 0;
WSBM_COND_BROADCAST(&sBuf->event);
WSBM_MUTEX_UNLOCK(&buf->mutex);
}
/*
 * Pool "validate" hook: wait until no CPU writer holds the buffer, then
 * mark it unFenced. The flag arguments are ignored. Always returns 0.
 */
static int
pool_validate(struct _WsbmBufStorage *buf,
              uint64_t set_flags __attribute__ ((unused)), uint64_t clr_flags __attribute__ ((unused)))
{
    struct _WsbmSlabBuffer *sBuf = slabBuffer(buf);

    WSBM_MUTEX_LOCK(&buf->mutex);
    for (;;) {
        if (wsbmAtomicRead(&sBuf->writers) == 0)
            break;
        WSBM_COND_WAIT(&sBuf->event, &buf->mutex);
    }
    sBuf->unFenced = 1;
    WSBM_MUTEX_UNLOCK(&buf->mutex);

    return 0;
}
/*
 * Pool "unvalidate" hook: undo pool_validate(). If the buffer is marked
 * unFenced the mark is cleared and waiters on the buffer event are woken.
 */
static void
pool_unvalidate(struct _WsbmBufStorage *buf)
{
    struct _WsbmSlabBuffer *sBuf = slabBuffer(buf);

    WSBM_MUTEX_LOCK(&buf->mutex);
    if (sBuf->unFenced != 0) {
        sBuf->unFenced = 0;
        WSBM_COND_BROADCAST(&sBuf->event);
    }
    WSBM_MUTEX_UNLOCK(&buf->mutex);
}
/*
 * Create a slab cache.
 *
 * @checkIntervalMsec: minimum time, in milliseconds, between two scans for
 *                     timed-out kernel buffer objects.
 * @slabTimeoutMsec:   time, in milliseconds, a released kernel buffer
 *                     object is kept for reuse before it may be destroyed.
 *
 * Returns the new cache, or NULL if memory allocation fails. The cache is
 * released with wsbmSlabCacheFinish().
 */
struct _WsbmSlabCache *
wsbmSlabCacheInit(uint32_t checkIntervalMsec, uint32_t slabTimeoutMsec)
{
    struct _WsbmSlabCache *tmp;

    tmp = calloc(1, sizeof(*tmp));
    if (!tmp)
        return NULL;

    WSBM_MUTEX_INIT(&tmp->mutex);
    WSBM_MUTEX_LOCK(&tmp->mutex);

    /*
     * Split into seconds and microseconds before scaling, so that large
     * millisecond values cannot overflow the 32-bit multiplication.
     */
    tmp->slabTimeout.tv_sec = slabTimeoutMsec / 1000;
    tmp->slabTimeout.tv_usec = (slabTimeoutMsec % 1000) * 1000;

    tmp->checkInterval.tv_sec = checkIntervalMsec / 1000;
    tmp->checkInterval.tv_usec = (checkIntervalMsec % 1000) * 1000;

    /* The first scan is due one check interval from now. */
    gettimeofday(&tmp->nextCheck, NULL);
    wsbmTimeAdd(&tmp->nextCheck, &tmp->checkInterval);

    WSBMINITLISTHEAD(&tmp->timeoutList);
    WSBMINITLISTHEAD(&tmp->unCached);
    WSBMINITLISTHEAD(&tmp->cached);

    WSBM_MUTEX_UNLOCK(&tmp->mutex);

    return tmp;
}
/*
 * Destroy a slab cache created by wsbmSlabCacheInit().
 *
 * One last scan for timed-out kernel buffer objects is run with a time one
 * check interval past cache->nextCheck. All cache lists are asserted to be
 * empty afterwards.
 */
void
wsbmSlabCacheFinish(struct _WsbmSlabCache *cache)
{
    struct timeval deadline = cache->nextCheck;

    WSBM_MUTEX_LOCK(&cache->mutex);
    wsbmTimeAdd(&deadline, &cache->checkInterval);
    wsbmFreeTimeoutKBOsLocked(cache, &deadline);
    WSBM_MUTEX_UNLOCK(&cache->mutex);

    assert(cache->timeoutList.next == &cache->timeoutList);
    assert(cache->unCached.next == &cache->unCached);
    assert(cache->cached.next == &cache->cached);

    WSBM_MUTEX_FREE(&cache->mutex);
    free(cache);
}
/*
 * Initialise the size header of one bucket: its mutex, empty slab and
 * delayed-buffer lists, owning pool and buffer size.
 */
static void
wsbmInitSizeHeader(struct _WsbmSlabPool *slabPool, uint32_t size,
                   struct _WsbmSlabSizeHeader *header)
{
    WSBM_MUTEX_INIT(&header->mutex);
    WSBM_MUTEX_LOCK(&header->mutex);

    header->slabPool = slabPool;
    header->bufSize = size;
    header->numDelayed = 0;

    WSBMINITLISTHEAD(&header->slabs);
    WSBMINITLISTHEAD(&header->freeSlabs);
    WSBMINITLISTHEAD(&header->delayedBuffers);

    WSBM_MUTEX_UNLOCK(&header->mutex);
}
/*
 * Shut down one size header: wait for the fence of every delayed buffer,
 * return the buffer to its slab, then destroy the header mutex.
 */
static void
wsbmFinishSizeHeader(struct _WsbmSlabSizeHeader *header)
{
    struct _WsbmListHead *cur, *nxt;

    WSBM_MUTEX_LOCK(&header->mutex);
    WSBMLISTFOREACHSAFE(cur, nxt, &header->delayedBuffers) {
        struct _WsbmSlabBuffer *pending =
            WSBMLISTENTRY(cur, struct _WsbmSlabBuffer, head);

        if (pending->fence != NULL) {
            (void)wsbmFenceFinish(pending->fence, pending->fenceType, 0);
            wsbmFenceUnreference(&pending->fence);
        }
        header->numDelayed--;
        wsbmSlabFreeBufferLocked(pending);
    }
    WSBM_MUTEX_UNLOCK(&header->mutex);

    WSBM_MUTEX_FREE(&header->mutex);
}
static void
pool_takedown(struct _WsbmBufferPool *pool)
{
struct _WsbmSlabPool *slabPool = slabPoolFromPool(pool);
unsigned int i;
for (i = 0; i < slabPool->numBuckets; ++i) {
wsbmFinishSizeHeader(&slabPool->headers[i]);
}
free(slabPool->headers);
free(slabPool->bucketSizes);
free(slabPool);
}
struct _WsbmBufferPool *
wsbmSlabPoolInit(int fd,
uint32_t devOffset,
uint32_t placement,
uint32_t validMask,
uint32_t smallestSize,
uint32_t numSizes,
uint32_t desiredNumBuffers,
uint32_t maxSlabSize,
uint32_t pageAlignment, struct _WsbmSlabCache *cache)
{
struct _WsbmBufferPool *pool;
struct _WsbmSlabPool *slabPool;
uint32_t i;
slabPool = calloc(1, sizeof(*slabPool));
if (!slabPool)
return NULL;
pool = &slabPool->pool;
slabPool->bucketSizes = calloc(numSizes, sizeof(*slabPool->bucketSizes));
if (!slabPool->bucketSizes)
goto out_err0;
slabPool->headers = calloc(numSizes, sizeof(*slabPool->headers));
if (!slabPool->headers)
goto out_err1;
slabPool->devOffset = devOffset;
slabPool->cache = cache;
slabPool->proposedPlacement = placement;
slabPool->validMask = validMask;
slabPool->numBuckets = numSizes;
slabPool->pageSize = getpagesize();
slabPool->pageAlignment = pageAlignment;
slabPool->maxSlabSize = maxSlabSize;
slabPool->desiredNumBuffers = desiredNumBuffers;
for (i = 0; i < slabPool->numBuckets; ++i) {
slabPool->bucketSizes[i] = (smallestSize << i);
wsbmInitSizeHeader(slabPool, slabPool->bucketSizes[i],
&slabPool->headers[i]);
}
pool->fd = fd;
pool->map = &pool_map;
pool->unmap = &pool_unmap;
pool->destroy = &pool_destroy;
pool->offset = &pool_offset;
pool->poolOffset = &pool_poolOffset;
pool->size = &pool_size;
pool->create = &pool_create;
pool->fence = &pool_fence;
pool->kernel = &pool_kernel;
pool->validate = &pool_validate;
pool->unvalidate = &pool_unvalidate;
pool->waitIdle = &pool_waitIdle;
pool->takeDown = &pool_takedown;
pool->releasefromcpu = &pool_releaseFromCpu;
pool->syncforcpu = &pool_syncForCpu;
return pool;
out_err1:
free(slabPool->bucketSizes);
out_err0:
free(slabPool);
return NULL;
}