lovr/src/modules/graphics/graphics.c

485 lines
17 KiB
C
Raw Normal View History

2016-11-19 09:28:01 +00:00
#include "graphics/graphics.h"
2022-04-30 03:38:34 +00:00
#include "data/image.h"
2022-04-21 07:27:13 +00:00
#include "core/gpu.h"
2022-04-27 05:51:24 +00:00
#include "core/os.h"
2022-04-21 07:27:13 +00:00
#include "util.h"
2022-04-30 03:38:34 +00:00
#include <math.h>
#include <stdlib.h>
2022-04-20 07:38:21 +00:00
#include <string.h>
2022-04-27 05:44:44 +00:00
#define MAX_FRAME_MEMORY (1 << 30)
struct Buffer {
uint32_t ref;
uint32_t size;
gpu_buffer* gpu;
BufferInfo info;
2022-04-27 07:35:09 +00:00
char* pointer;
};
2022-04-30 03:38:34 +00:00
struct Texture {
uint32_t ref;
gpu_texture* gpu;
gpu_texture* renderView;
TextureInfo info;
};
struct Pass {
uint32_t ref;
PassInfo info;
gpu_stream* stream;
};
2022-04-27 05:44:44 +00:00
typedef struct {
char* memory;
uint32_t cursor;
uint32_t length;
} Allocator;
2019-06-27 08:47:08 +00:00
static struct {
bool initialized;
bool active;
uint32_t tick;
Pass* transfers;
2022-04-22 20:28:59 +00:00
gpu_device_info device;
gpu_features features;
gpu_limits limits;
2022-04-27 05:44:44 +00:00
Allocator allocator;
2019-06-27 08:47:08 +00:00
} state;
2016-07-07 07:04:24 +00:00
2022-04-21 07:27:13 +00:00
// Helpers
static void* tempAlloc(size_t size);
static void beginFrame(void);
static gpu_stream* getTransfers(void);
2022-04-30 03:38:34 +00:00
static size_t measureTexture(TextureFormat format, uint16_t w, uint16_t h, uint16_t d);
2022-04-21 07:27:13 +00:00
static void onMessage(void* context, const char* message, bool severe);
// Entry
bool lovrGraphicsInit(bool debug) {
2022-04-19 02:30:58 +00:00
if (state.initialized) return false;
2022-04-21 07:27:13 +00:00
2022-04-27 07:28:39 +00:00
float16Init();
2022-04-21 07:27:13 +00:00
gpu_config config = {
.debug = debug,
.callback = onMessage,
.engineName = "LOVR",
.engineVersion = { LOVR_VERSION_MAJOR, LOVR_VERSION_MINOR, LOVR_VERSION_PATCH },
.device = &state.device,
.features = &state.features,
.limits = &state.limits
2022-04-21 07:27:13 +00:00
};
if (!gpu_init(&config)) {
lovrThrow("Failed to initialize GPU");
}
2022-04-27 05:44:44 +00:00
// Temporary frame memory uses a large 1GB virtual memory allocation, committing pages as needed
state.allocator.length = 1 << 14;
state.allocator.memory = os_vm_init(MAX_FRAME_MEMORY);
os_vm_commit(state.allocator.memory, state.allocator.length);
2022-04-19 02:30:58 +00:00
state.initialized = true;
return true;
2016-09-28 03:20:08 +00:00
}
void lovrGraphicsDestroy() {
if (!state.initialized) return;
2022-04-21 07:27:13 +00:00
gpu_destroy();
2022-04-27 05:44:44 +00:00
os_vm_free(state.allocator.memory, MAX_FRAME_MEMORY);
2019-06-27 08:47:08 +00:00
memset(&state, 0, sizeof(state));
2016-07-07 07:04:24 +00:00
}
2022-04-21 07:27:13 +00:00
void lovrGraphicsGetDevice(GraphicsDevice* device) {
2022-04-22 20:28:59 +00:00
device->deviceId = state.device.deviceId;
device->vendorId = state.device.vendorId;
device->name = state.device.deviceName;
device->renderer = state.device.renderer;
device->subgroupSize = state.device.subgroupSize;
2022-04-22 20:28:59 +00:00
device->discrete = state.device.discrete;
}
void lovrGraphicsGetFeatures(GraphicsFeatures* features) {
features->textureBC = state.features.textureBC;
features->textureASTC = state.features.textureASTC;
features->wireframe = state.features.wireframe;
features->depthClamp = state.features.depthClamp;
features->indirectDrawFirstInstance = state.features.indirectDrawFirstInstance;
features->float64 = state.features.float64;
features->int64 = state.features.int64;
features->int16 = state.features.int16;
}
void lovrGraphicsGetLimits(GraphicsLimits* limits) {
limits->textureSize2D = state.limits.textureSize2D;
limits->textureSize3D = state.limits.textureSize3D;
limits->textureSizeCube = state.limits.textureSizeCube;
limits->textureLayers = state.limits.textureLayers;
limits->renderSize[0] = state.limits.renderSize[0];
limits->renderSize[1] = state.limits.renderSize[1];
limits->renderSize[2] = state.limits.renderSize[2];
limits->uniformBufferRange = state.limits.uniformBufferRange;
limits->storageBufferRange = state.limits.storageBufferRange;
limits->uniformBufferAlign = state.limits.uniformBufferAlign;
limits->storageBufferAlign = state.limits.storageBufferAlign;
limits->vertexAttributes = state.limits.vertexAttributes;
limits->vertexBufferStride = state.limits.vertexBufferStride;
limits->vertexShaderOutputs = state.limits.vertexShaderOutputs;
limits->clipDistances = state.limits.clipDistances;
limits->cullDistances = state.limits.cullDistances;
limits->clipAndCullDistances = state.limits.clipAndCullDistances;
memcpy(limits->computeDispatchCount, state.limits.computeDispatchCount, 3 * sizeof(uint32_t));
memcpy(limits->computeWorkgroupSize, state.limits.computeWorkgroupSize, 3 * sizeof(uint32_t));
limits->computeWorkgroupVolume = state.limits.computeWorkgroupVolume;
limits->computeSharedMemory = state.limits.computeSharedMemory;
limits->shaderConstantSize = state.limits.pushConstantSize;
limits->indirectDrawCount = state.limits.indirectDrawCount;
limits->instances = state.limits.instances;
limits->anisotropy = state.limits.anisotropy;
limits->pointSize = state.limits.pointSize;
}
2022-04-30 00:12:10 +00:00
bool lovrGraphicsIsFormatSupported(uint32_t format, uint32_t features) {
uint8_t supports = state.features.formats[format];
if (!features) return supports;
if ((features & TEXTURE_FEATURE_SAMPLE) && !(supports & GPU_FEATURE_SAMPLE)) return false;
if ((features & TEXTURE_FEATURE_FILTER) && !(supports & GPU_FEATURE_FILTER)) return false;
if ((features & TEXTURE_FEATURE_RENDER) && !(supports & GPU_FEATURE_RENDER)) return false;
if ((features & TEXTURE_FEATURE_BLEND) && !(supports & GPU_FEATURE_BLEND)) return false;
if ((features & TEXTURE_FEATURE_STORAGE) && !(supports & GPU_FEATURE_STORAGE)) return false;
if ((features & TEXTURE_FEATURE_ATOMIC) && !(supports & GPU_FEATURE_ATOMIC)) return false;
if ((features & TEXTURE_FEATURE_BLIT_SRC) && !(supports & GPU_FEATURE_BLIT_SRC)) return false;
if ((features & TEXTURE_FEATURE_BLIT_DST) && !(supports & GPU_FEATURE_BLIT_DST)) return false;
return true;
}
void lovrGraphicsSubmit(Pass** passes, uint32_t count) {
if (!state.active) {
return;
}
// Allocate a few extra stream handles for any internal passes we sneak in
gpu_stream** streams = tempAlloc((count + 3) * sizeof(gpu_stream*));
uint32_t extraPassCount = 0;
if (state.transfers) {
streams[extraPassCount++] = state.transfers->stream;
}
for (uint32_t i = 0; i < count; i++) {
streams[extraPassCount + i] = passes[i]->stream;
}
for (uint32_t i = 0; i < extraPassCount + count; i++) {
gpu_stream_end(streams[i]);
}
gpu_submit(streams, extraPassCount + count);
state.transfers = NULL;
state.active = false;
}
2022-04-29 05:37:03 +00:00
void lovrGraphicsWait() {
gpu_wait();
}
// Buffer
2022-04-27 07:28:39 +00:00
Buffer* lovrGraphicsGetBuffer(BufferInfo* info, void** data) {
uint32_t size = info->length * info->stride;
2022-04-27 07:28:39 +00:00
lovrCheck(size > 0, "Buffer size can not be zero");
2022-04-30 03:38:34 +00:00
lovrCheck(size <= 1 << 30, "Max buffer size is 1GB");
2022-04-27 07:28:39 +00:00
Buffer* buffer = tempAlloc(sizeof(Buffer) + gpu_sizeof_buffer());
2022-04-27 07:28:39 +00:00
buffer->ref = 1;
buffer->size = size;
buffer->gpu = (gpu_buffer*) (buffer + 1);
buffer->info = *info;
buffer->pointer = gpu_map(buffer->gpu, size, state.limits.uniformBufferAlign, GPU_MAP_WRITE);
if (data) {
*data = buffer->pointer;
}
return buffer;
}
Buffer* lovrBufferCreate(BufferInfo* info, void** data) {
uint32_t size = info->length * info->stride;
lovrCheck(size > 0, "Buffer size can not be zero");
lovrCheck(size <= 1 << 30, "Max buffer size is 1GB");
Buffer* buffer = calloc(1, sizeof(Buffer) + gpu_sizeof_buffer());
lovrAssert(buffer, "Out of memory");
buffer->ref = 1;
buffer->size = size;
buffer->gpu = (gpu_buffer*) (buffer + 1);
buffer->info = *info;
gpu_buffer_init(buffer->gpu, &(gpu_buffer_info) {
.size = buffer->size,
.label = info->label,
.pointer = data
});
2022-04-27 07:28:39 +00:00
if (data && *data == NULL) {
gpu_buffer* scratchpad = tempAlloc(gpu_sizeof_buffer());
2022-04-27 07:28:39 +00:00
*data = gpu_map(scratchpad, size, 4, GPU_MAP_WRITE);
// TODO copy scratchpad to buffer
}
return buffer;
}
void lovrBufferDestroy(void* ref) {
Buffer* buffer = ref;
2022-04-27 07:28:39 +00:00
if (buffer->pointer) return;
gpu_buffer_destroy(buffer->gpu);
free(buffer);
}
const BufferInfo* lovrBufferGetInfo(Buffer* buffer) {
return &buffer->info;
}
2022-04-27 07:28:39 +00:00
bool lovrBufferIsTemporary(Buffer* buffer) {
return !!buffer->pointer;
}
void* lovrBufferMap(Buffer* buffer, uint32_t offset, uint32_t size) {
if (size == ~0u) {
size = buffer->size - offset;
}
lovrCheck(offset + size <= buffer->size, "Buffer write range [%d,%d] exceeds buffer size", offset, offset + size);
if (buffer->pointer) {
2022-04-27 07:35:09 +00:00
return buffer->pointer + offset;
2022-04-27 07:28:39 +00:00
}
gpu_stream* transfers = getTransfers();
gpu_buffer* scratchpad = tempAlloc(gpu_sizeof_buffer());
void* data = gpu_map(scratchpad, size, 4, GPU_MAP_WRITE);
gpu_copy_buffers(transfers, scratchpad, buffer->gpu, 0, offset, size);
return data;
2022-04-27 07:28:39 +00:00
}
void lovrBufferClear(Buffer* buffer, uint32_t offset, uint32_t size) {
lovrCheck(size % 4 == 0, "Buffer clear size must be a multiple of 4");
lovrCheck(offset % 4 == 0, "Buffer clear offset must be a multiple of 4");
2022-04-27 07:28:39 +00:00
lovrCheck(offset + size <= buffer->size, "Tried to clear past the end of the Buffer");
if (buffer->pointer) {
2022-04-27 07:35:09 +00:00
memset(buffer->pointer + offset, 0, size);
2022-04-27 07:28:39 +00:00
} else {
gpu_stream* transfers = getTransfers();
gpu_clear_buffer(transfers, buffer->gpu, offset, size);
2022-04-27 07:28:39 +00:00
}
}
2022-04-30 03:38:34 +00:00
// Texture
Texture* lovrTextureCreate(TextureInfo* info) {
uint32_t limits[] = {
[TEXTURE_2D] = state.limits.textureSize2D,
[TEXTURE_CUBE] = state.limits.textureSizeCube,
[TEXTURE_ARRAY] = state.limits.textureSize2D,
[TEXTURE_VOLUME] = state.limits.textureSize3D
};
uint32_t limit = limits[info->type];
uint32_t mips = log2(MAX(MAX(info->width, info->height), (info->type == TEXTURE_VOLUME ? info->depth : 1))) + 1;
uint8_t supports = state.features.formats[info->format];
lovrCheck(info->width > 0, "Texture width must be greater than zero");
lovrCheck(info->height > 0, "Texture height must be greater than zero");
lovrCheck(info->depth > 0, "Texture depth must be greater than zero");
lovrCheck(info->width <= limit, "Texture %s exceeds the limit for this texture type (%d)", "width", limit);
lovrCheck(info->height <= limit, "Texture %s exceeds the limit for this texture type (%d)", "height", limit);
lovrCheck(info->depth <= limit || info->type != TEXTURE_VOLUME, "Texture %s exceeds the limit for this texture type (%d)", "depth", limit);
lovrCheck(info->depth <= state.limits.textureLayers || info->type != TEXTURE_ARRAY, "Texture %s exceeds the limit for this texture type (%d)", "depth", limit);
lovrCheck(info->depth == 1 || info->type != TEXTURE_2D, "2D textures must have a depth of 1");
lovrCheck(info->depth == 6 || info->type != TEXTURE_CUBE, "Cubemaps must have a depth of 6");
lovrCheck(info->width == info->height || info->type != TEXTURE_CUBE, "Cubemaps must be square");
lovrCheck(measureTexture(info->format, info->width, info->height, info->depth) < 1 << 30, "Memory for a Texture can not exceed 1GB");
lovrCheck(info->samples == 1 || info->samples == 4, "Currently, Texture multisample count must be 1 or 4");
lovrCheck(info->samples == 1 || info->type != TEXTURE_CUBE, "Cubemaps can not be multisampled");
lovrCheck(info->samples == 1 || info->type != TEXTURE_VOLUME, "Volume textures can not be multisampled");
lovrCheck(info->samples == 1 || ~info->usage & TEXTURE_STORAGE, "Currently, Textures with the 'storage' flag can not be multisampled");
lovrCheck(info->samples == 1 || info->mipmaps == 1, "Multisampled textures can only have 1 mipmap");
lovrCheck(~info->usage & TEXTURE_SAMPLE || (supports & GPU_FEATURE_SAMPLE), "GPU does not support the 'sample' flag for this format");
lovrCheck(~info->usage & TEXTURE_RENDER || (supports & GPU_FEATURE_RENDER), "GPU does not support the 'render' flag for this format");
lovrCheck(~info->usage & TEXTURE_STORAGE || (supports & GPU_FEATURE_STORAGE), "GPU does not support the 'storage' flag for this format");
lovrCheck(~info->usage & TEXTURE_RENDER || info->width <= state.limits.renderSize[0], "Texture has 'render' flag but its size exceeds the renderSize limit");
lovrCheck(~info->usage & TEXTURE_RENDER || info->height <= state.limits.renderSize[1], "Texture has 'render' flag but its size exceeds the renderSize limit");
lovrCheck(info->mipmaps == ~0u || info->mipmaps <= mips, "Texture has more than the max number of mipmap levels for its size (%d)", mips);
lovrCheck((info->format < FORMAT_BC1 || info->format > FORMAT_BC7) || state.features.textureBC, "%s textures are not supported on this GPU", "BC");
lovrCheck(info->format < FORMAT_ASTC_4x4 || state.features.textureASTC, "%s textures are not supported on this GPU", "ASTC");
Texture* texture = calloc(1, sizeof(Texture) + gpu_sizeof_texture());
lovrAssert(texture, "Out of memory");
texture->ref = 1;
texture->gpu = (gpu_texture*) (texture + 1);
texture->info = *info;
texture->info.mipmaps = CLAMP(texture->info.mipmaps, 1, mips);
gpu_texture_init(texture->gpu, &(gpu_texture_info) {
.type = (gpu_texture_type) info->type,
.format = (gpu_texture_format) info->format,
.size = { info->width, info->height, info->depth },
.mipmaps = texture->info.mipmaps,
.samples = MAX(info->samples, 1),
.usage =
((info->usage & TEXTURE_SAMPLE) ? GPU_TEXTURE_SAMPLE : 0) |
((info->usage & TEXTURE_RENDER) ? GPU_TEXTURE_RENDER : 0) |
((info->usage & TEXTURE_STORAGE) ? GPU_TEXTURE_STORAGE : 0) |
((info->usage & TEXTURE_COPY) ? GPU_TEXTURE_COPY_SRC | GPU_TEXTURE_COPY_DST : 0),
.srgb = info->srgb,
.handle = info->handle,
.label = info->label
});
// Automatically create a renderable view for renderable non-volume textures
if (info->usage & TEXTURE_RENDER && info->type != TEXTURE_VOLUME && info->depth <= state.limits.renderSize[2]) {
if (info->mipmaps == 1) {
texture->renderView = texture->gpu;
} else {
gpu_texture_view_info view = {
.source = texture->gpu,
.type = GPU_TEXTURE_ARRAY,
.layerCount = info->depth,
.levelCount = 1
};
texture->renderView = malloc(gpu_sizeof_texture());
lovrAssert(texture->renderView, "Out of memory");
lovrAssert(gpu_texture_init_view(texture->renderView, &view), "Failed to create texture view");
}
}
return texture;
}
void lovrTextureDestroy(void* ref) {
Texture* texture = ref;
lovrRelease(texture->info.parent, lovrTextureDestroy);
if (texture->renderView && texture->renderView != texture->gpu) gpu_texture_destroy(texture->renderView);
if (texture->gpu) gpu_texture_destroy(texture->gpu);
free(texture);
}
// Pass
Pass* lovrGraphicsGetPass(PassInfo* info) {
beginFrame();
Pass* pass = tempAlloc(sizeof(Pass));
pass->ref = 1;
pass->info = *info;
pass->stream = gpu_stream_begin(info->label);
return pass;
}
void lovrPassDestroy(void* ref) {
//
}
const PassInfo* lovrPassGetInfo(Pass* pass) {
return &pass->info;
}
2022-04-21 07:27:13 +00:00
// Helpers
static void* tempAlloc(size_t size) {
2022-04-27 05:44:44 +00:00
while (state.allocator.cursor + size > state.allocator.length) {
lovrAssert(state.allocator.length << 1 <= MAX_FRAME_MEMORY, "Out of memory");
os_vm_commit(state.allocator.memory + state.allocator.length, state.allocator.length);
state.allocator.length <<= 1;
}
uint32_t cursor = ALIGN(state.allocator.cursor, 8);
state.allocator.cursor = cursor + size;
return state.allocator.memory + cursor;
}
static void beginFrame(void) {
if (state.active) {
return;
}
state.active = true;
state.tick = gpu_begin();
}
static gpu_stream* getTransfers(void) {
if (!state.transfers) {
state.transfers = lovrGraphicsGetPass(&(PassInfo) {
.type = PASS_TRANSFER,
.label = "Internal Transfers"
});
}
return state.transfers->stream;
}
2022-04-30 03:38:34 +00:00
// Returns number of bytes of a 3D texture region of a given format
static size_t measureTexture(TextureFormat format, uint16_t w, uint16_t h, uint16_t d) {
switch (format) {
case FORMAT_R8: return w * h * d;
case FORMAT_RG8:
case FORMAT_R16:
case FORMAT_R16F:
case FORMAT_RGB565:
case FORMAT_RGB5A1:
case FORMAT_D16: return w * h * d * 2;
case FORMAT_RGBA8:
case FORMAT_RG16:
case FORMAT_RG16F:
case FORMAT_R32F:
case FORMAT_RG11B10F:
case FORMAT_RGB10A2:
case FORMAT_D24S8:
case FORMAT_D32F: return w * h * d * 4;
case FORMAT_RGBA16:
case FORMAT_RGBA16F:
case FORMAT_RG32F: return w * h * d * 8;
case FORMAT_RGBA32F: return w * h * d * 16;
case FORMAT_BC1:
case FORMAT_BC2:
case FORMAT_BC3:
case FORMAT_BC4U:
case FORMAT_BC4S:
case FORMAT_BC5U:
case FORMAT_BC5S:
case FORMAT_BC6UF:
case FORMAT_BC6SF:
case FORMAT_BC7:
case FORMAT_ASTC_4x4: return ((w + 3) / 4) * ((h + 3) / 4) * d * 16;
case FORMAT_ASTC_5x4: return ((w + 4) / 5) * ((h + 3) / 4) * d * 16;
case FORMAT_ASTC_5x5: return ((w + 4) / 5) * ((h + 4) / 5) * d * 16;
case FORMAT_ASTC_6x5: return ((w + 5) / 6) * ((h + 4) / 5) * d * 16;
case FORMAT_ASTC_6x6: return ((w + 5) / 6) * ((h + 5) / 6) * d * 16;
case FORMAT_ASTC_8x5: return ((w + 7) / 8) * ((h + 4) / 5) * d * 16;
case FORMAT_ASTC_8x6: return ((w + 7) / 8) * ((h + 5) / 6) * d * 16;
case FORMAT_ASTC_8x8: return ((w + 7) / 8) * ((h + 7) / 8) * d * 16;
case FORMAT_ASTC_10x5: return ((w + 9) / 10) * ((h + 4) / 5) * d * 16;
case FORMAT_ASTC_10x6: return ((w + 9) / 10) * ((h + 5) / 6) * d * 16;
case FORMAT_ASTC_10x8: return ((w + 9) / 10) * ((h + 7) / 8) * d * 16;
case FORMAT_ASTC_10x10: return ((w + 9) / 10) * ((h + 9) / 10) * d * 16;
case FORMAT_ASTC_12x10: return ((w + 11) / 12) * ((h + 9) / 10) * d * 16;
case FORMAT_ASTC_12x12: return ((w + 11) / 12) * ((h + 11) / 12) * d * 16;
default: lovrUnreachable();
}
}
2022-04-21 07:27:13 +00:00
static void onMessage(void* context, const char* message, bool severe) {
if (severe) {
lovrLog(LOG_ERROR, "GPU", message);
} else {
lovrLog(LOG_DEBUG, "GPU", message);
}
}