Add uniform buffers

2024-07-22 00:27:24 +02:00 · 2024-07-22 00:27:24 +02:00 · b1bbd65aaa
commit b1bbd65aaa
parent 8c60f79f7d
13 changed files with 5695 additions and 4 deletions
--- a/build.zig
+++ b/build.zig
@ -14,6 +14,8 @@ pub fn build(b: *std.Build) void {
        .optimize = optimize,
    });
    // --- Dependencies ---
    // Vulkan
    const vkzig_dep = b.dependency("vulkan_zig", .{
        .registry = @as([]const u8, b.pathFromRoot("./vk.xml")),
@ -35,6 +37,12 @@ pub fn build(b: *std.Build) void {
    sdl_sdk.link(exe, .dynamic, .SDL2);
    exe.root_module.addImport("sdl2", sdl_sdk.getWrapperModuleVulkan(vkzig_bindings));
    // zmath
    const zmath = b.dependency("zmath", .{});
    exe.root_module.addImport("zmath", zmath.module("root"));
    // ---
    b.installArtifact(exe);
    const check = b.step("check", "Check if vulkan-test compiles");
--- a/build.zig.zon
+++ b/build.zig.zon
@ -4,6 +4,7 @@
    .version = "0.1.0",
    .dependencies = .{
        .zmath = .{ .path = "libs/zmath" },
        .vulkan_zig = .{
            .url = "https://github.com/Snektron/vulkan-zig/archive/9f6e6177b1fdb3ed22231d9216a24480e84cfa5e.tar.gz",
            .hash = "1220f2961df224f7d35dee774b26194b8b937cc252fa8e4023407776c58521d53e38",
--- a/libs/zmath/LICENSE
+++ b/libs/zmath/LICENSE
@ -0,0 +1,22 @@
 MIT License
 Copyright (c) 2021 Michal Ziulek
 Copyright (c) 2024 zig-gamedev contributors
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
 in the Software without restriction, including without limitation the rights
 to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 copies of the Software, and to permit persons to whom the Software is
 furnished to do so, subject to the following conditions:
 The above copyright notice and this permission notice shall be included in all
 copies or substantial portions of the Software.
 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 SOFTWARE.
--- a/libs/zmath/README.md
+++ b/libs/zmath/README.md
@ -0,0 +1,133 @@
 # zmath v0.10.0 - SIMD math library for game developers
 Tested on x86_64 and AArch64.
 Provides ~140 optimized routines and ~70 extensive tests.
 Can be used with any graphics API.
 Documentation can be found [here](https://github.com/michal-z/zig-gamedev/blob/main/libs/zmath/src/zmath.zig).
 Benchamrks can be found [here](https://github.com/michal-z/zig-gamedev/blob/main/libs/zmath/src/benchmark.zig).
 An intro article can be found [here](https://zig.news/michalz/fast-multi-platform-simd-math-library-in-zig-2adn).
 ## Getting started
 Copy `zmath` into a subdirectory of your project and add the following to your `build.zig.zon` .dependencies:
 ```zig
    .zmath = .{ .path = "libs/zmath" },
 ```
 Then in your `build.zig` add:
 ```zig
 pub fn build(b: *std.Build) void {
    const exe = b.addExecutable(.{ ... });
    const zmath = b.dependency("zmath", .{});
    exe.root_module.addImport("zmath", zmath.module("root"));
 }
 ```
 Now in your code you may import and use zmath:
 ```zig
 const zm = @import("zmath");
 pub fn main() !void {
    //
    // OpenGL/Vulkan example
    //
    const object_to_world = zm.rotationY(..);
    const world_to_view = zm.lookAtRh(
        zm.f32x4(3.0, 3.0, 3.0, 1.0), // eye position
        zm.f32x4(0.0, 0.0, 0.0, 1.0), // focus point
        zm.f32x4(0.0, 1.0, 0.0, 0.0), // up direction ('w' coord is zero because this is a vector not a point)
    );
    // `perspectiveFovRhGl` produces Z values in [-1.0, 1.0] range (Vulkan app should use `perspectiveFovRh`)
    const view_to_clip = zm.perspectiveFovRhGl(0.25 * math.pi, aspect_ratio, 0.1, 20.0);
    const object_to_view = zm.mul(object_to_world, world_to_view);
    const object_to_clip = zm.mul(object_to_view, view_to_clip);
    // Transposition is needed because GLSL uses column-major matrices by default
    gl.uniformMatrix4fv(0, 1, gl.TRUE, zm.arrNPtr(&object_to_clip));
    // In GLSL: gl_Position = vec4(in_position, 1.0) * object_to_clip;
    //
    // DirectX example
    //
    const object_to_world = zm.rotationY(..);
    const world_to_view = zm.lookAtLh(
        zm.f32x4(3.0, 3.0, -3.0, 1.0), // eye position
        zm.f32x4(0.0, 0.0, 0.0, 1.0), // focus point
        zm.f32x4(0.0, 1.0, 0.0, 0.0), // up direction ('w' coord is zero because this is a vector not a point)
    );
    const view_to_clip = zm.perspectiveFovLh(0.25 * math.pi, aspect_ratio, 0.1, 20.0);
    const object_to_view = zm.mul(object_to_world, world_to_view);
    const object_to_clip = zm.mul(object_to_view, view_to_clip);
    // Transposition is needed because HLSL uses column-major matrices by default
    const mem = allocateUploadMemory(...);
    zm.storeMat(mem, zm.transpose(object_to_clip));
    // In HLSL: out_position_sv = mul(float4(in_position, 1.0), object_to_clip);
    //
    // 'WASD' camera movement example
    //
    {
        const speed = zm.f32x4s(10.0);
        const delta_time = zm.f32x4s(demo.frame_stats.delta_time);
        const transform = zm.mul(zm.rotationX(demo.camera.pitch), zm.rotationY(demo.camera.yaw));
        var forward = zm.normalize3(zm.mul(zm.f32x4(0.0, 0.0, 1.0, 0.0), transform));
        zm.storeArr3(&demo.camera.forward, forward);
        const right = speed * delta_time * zm.normalize3(zm.cross3(zm.f32x4(0.0, 1.0, 0.0, 0.0), forward));
        forward = speed * delta_time * forward;
        var cam_pos = zm.loadArr3(demo.camera.position);
        if (keyDown('W')) {
            cam_pos += forward;
        } else if (keyDown('S')) {
            cam_pos -= forward;
        }
        if (keyDown('D')) {
            cam_pos += right;
        } else if (keyDown('A')) {
            cam_pos -= right;
        }
        zm.storeArr3(&demo.camera.position, cam_pos);
    }
    //
    // SIMD wave equation solver example (works with vector width 4, 8 and 16)
    // 'T' can be F32x4, F32x8 or F32x16
    //
    var z_index: i32 = 0;
    while (z_index < grid_size) : (z_index += 1) {
        const z = scale * @intToFloat(f32, z_index - grid_size / 2);
        const vz = zm.splat(T, z);
        var x_index: i32 = 0;
        while (x_index < grid_size) : (x_index += zm.veclen(T)) {
            const x = scale * @intToFloat(f32, x_index - grid_size / 2);
            const vx = zm.splat(T, x) + voffset * zm.splat(T, scale);
            const d = zm.sqrt(vx * vx + vz * vz);
            const vy = zm.sin(d - vtime);
            const index = @intCast(usize, x_index + z_index * grid_size);
            zm.store(xslice[index..], vx, 0);
            zm.store(yslice[index..], vy, 0);
            zm.store(zslice[index..], vz, 0);
        }
    }
 }
 ```
--- a/libs/zmath/build.zig
+++ b/libs/zmath/build.zig
@ -0,0 +1,62 @@
 const std = @import("std");
 pub fn build(b: *std.Build) void {
    const target = b.standardTargetOptions(.{});
    const options = .{
        .optimize = b.option(
            std.builtin.OptimizeMode,
            "optimize",
            "Select optimization mode",
        ) orelse b.standardOptimizeOption(.{
            .preferred_optimize_mode = .ReleaseFast,
        }),
        .enable_cross_platform_determinism = b.option(
            bool,
            "enable_cross_platform_determinism",
            "Enable cross-platform determinism",
        ) orelse true,
    };
    const options_step = b.addOptions();
    inline for (std.meta.fields(@TypeOf(options))) |field| {
        options_step.addOption(field.type, field.name, @field(options, field.name));
    }
    const options_module = options_step.createModule();
    const zmath = b.addModule("root", .{
        .root_source_file = b.path("src/main.zig"),
        .imports = &.{
            .{ .name = "zmath_options", .module = options_module },
        },
    });
    const test_step = b.step("test", "Run zmath tests");
    const tests = b.addTest(.{
        .name = "zmath-tests",
        .root_source_file = b.path("src/main.zig"),
        .target = target,
        .optimize = options.optimize,
    });
    b.installArtifact(tests);
    tests.root_module.addImport("zmath_options", options_module);
    test_step.dependOn(&b.addRunArtifact(tests).step);
    const benchmark_step = b.step("benchmark", "Run zmath benchmarks");
    const benchmarks = b.addExecutable(.{
        .name = "zmath-benchmarks",
        .root_source_file = b.path("src/benchmark.zig"),
        .target = target,
        .optimize = options.optimize,
    });
    b.installArtifact(benchmarks);
    benchmarks.root_module.addImport("zmath", zmath);
    benchmark_step.dependOn(&b.addRunArtifact(benchmarks).step);
 }
--- a/libs/zmath/build.zig.zon
+++ b/libs/zmath/build.zig.zon
@ -0,0 +1,10 @@
 .{
    .name = "zmath",
    .version = "0.10.0",
    .paths = .{
        "build.zig",
        "build.zig.zon",
        "src",
        "README.md",
    },
 }
--- a/libs/zmath/src/benchmark.zig
+++ b/libs/zmath/src/benchmark.zig
@ -0,0 +1,469 @@
 // -------------------------------------------------------------------------------------------------
 // zmath - benchmarks
 // -------------------------------------------------------------------------------------------------
 // 'zig build benchmark -Doptimize=ReleaseFast' will build and benchmakrs with all optimisations.
 //
 // -------------------------------------------------------------------------------------------------
 // 'AMD Ryzen 9 3950X 16-Core Processor', Windows 11, Zig 0.10.0-dev.2620+0e9458a3f, ReleaseFast
 // -------------------------------------------------------------------------------------------------
 //                matrix mul benchmark (AOS) - scalar version: 1.5880s, zmath version: 1.0642s
 //       cross3, scale, bias benchmark (AOS) - scalar version: 0.9318s, zmath version: 0.6888s
 // cross3, dot3, scale, bias benchmark (AOS) - scalar version: 1.2258s, zmath version: 1.1095s
 //            quaternion mul benchmark (AOS) - scalar version: 1.4123s, zmath version: 0.6958s
 //                      wave benchmark (SOA) - scalar version: 4.8165s, zmath version: 0.7338s
 //
 // -------------------------------------------------------------------------------------------------
 // 'AMD Ryzen 7 5800X 8-Core Processer', Linux 5.17.14, Zig 0.10.0-dev.2624+d506275a0, ReleaseFast
 // -------------------------------------------------------------------------------------------------
 //                matrix mul benchmark (AOS) - scalar version: 1.3672s, zmath version: 0.8617s
 //       cross3, scale, bias benchmark (AOS) - scalar version: 0.6586s, zmath version: 0.4803s
 // cross3, dot3, scale, bias benchmark (AOS) - scalar version: 1.0620s, zmath version: 0.8942s
 //            quaternion mul benchmark (AOS) - scalar version: 1.1324s, zmath version: 0.6064s
 //                      wave benchmark (SOA) - scalar version: 3.6598s, zmath version: 0.4231s
 //
 // -------------------------------------------------------------------------------------------------
 // 'Apple M1 Max', macOS Version 12.4, Zig 0.10.0-dev.2657+74442f350, ReleaseFast
 // -------------------------------------------------------------------------------------------------
 //                matrix mul benchmark (AOS) - scalar version: 1.0297s, zmath version: 1.0538s
 //       cross3, scale, bias benchmark (AOS) - scalar version: 0.6294s, zmath version: 0.6532s
 // cross3, dot3, scale, bias benchmark (AOS) - scalar version: 0.9807s, zmath version: 1.0988s
 //            quaternion mul benchmark (AOS) - scalar version: 1.5413s, zmath version: 0.7800s
 //                      wave benchmark (SOA) - scalar version: 3.4220s, zmath version: 1.0255s
 //
 // -------------------------------------------------------------------------------------------------
 // '11th Gen Intel(R) Core(TM) i7-11800H @ 2.30GHz', Windows 11, Zig 0.10.0-dev.2620+0e9458a3f, ReleaseFast
 // -------------------------------------------------------------------------------------------------
 //                matrix mul benchmark (AOS) - scalar version: 2.2308s, zmath version: 0.9376s
 //       cross3, scale, bias benchmark (AOS) - scalar version: 1.0821s, zmath version: 0.5110s
 // cross3, dot3, scale, bias benchmark (AOS) - scalar version: 1.6580s, zmath version: 0.9167s
 //            quaternion mul benchmark (AOS) - scalar version: 2.0139s, zmath version: 0.5856s
 //                      wave benchmark (SOA) - scalar version: 3.7832s, zmath version: 0.3642s
 //
 // -------------------------------------------------------------------------------------------------
 pub fn main() !void {
    var gpa = std.heap.GeneralPurposeAllocator(.{}){};
    defer _ = gpa.deinit();
    const allocator = gpa.allocator();
    // m = mul(ma, mb); data set fits in L1 cache; AOS data layout.
    try mat4MulBenchmark(allocator, 100_000);
    // v = 0.01 * cross3(va, vb) + vec3(1.0); data set fits in L1 cache; AOS data layout.
    try cross3ScaleBiasBenchmark(allocator, 10_000);
    // v = dot3(va, vb) * (0.1 * cross3(va, vb) + vec3(1.0)); data set fits in L1 cache; AOS data layout.
    try cross3Dot3ScaleBiasBenchmark(allocator, 10_000);
    // q = qmul(qa, qb); data set fits in L1 cache; AOS data layout.
    try quatBenchmark(allocator, 10_000);
    // d = sqrt(x * x + z * z); y = sin(d - t); SOA layout.
    try waveBenchmark(allocator, 1_000);
 }
 const std = @import("std");
 const time = std.time;
 const Timer = time.Timer;
 const zm = @import("zmath");
 var prng = std.Random.DefaultPrng.init(0);
 const random = prng.random();
 noinline fn mat4MulBenchmark(allocator: std.mem.Allocator, comptime count: comptime_int) !void {
    std.debug.print("\n", .{});
    std.debug.print("{s:>42} - ", .{"matrix mul benchmark (AOS)"});
    var data0 = std.ArrayList([16]f32).init(allocator);
    defer data0.deinit();
    var data1 = std.ArrayList([16]f32).init(allocator);
    defer data1.deinit();
    var i: usize = 0;
    while (i < 64) : (i += 1) {
        try data0.append([16]f32{
            random.float(f32), random.float(f32), random.float(f32), random.float(f32),
            random.float(f32), random.float(f32), random.float(f32), random.float(f32),
            random.float(f32), random.float(f32), random.float(f32), random.float(f32),
            random.float(f32), random.float(f32), random.float(f32), random.float(f32),
        });
        try data1.append([16]f32{
            random.float(f32), random.float(f32), random.float(f32), random.float(f32),
            random.float(f32), random.float(f32), random.float(f32), random.float(f32),
            random.float(f32), random.float(f32), random.float(f32), random.float(f32),
            random.float(f32), random.float(f32), random.float(f32), random.float(f32),
        });
    }
    // Warmup, fills L1 cache.
    i = 0;
    while (i < 100) : (i += 1) {
        for (data1.items) |b| {
            for (data0.items) |a| {
                const ma = zm.loadMat(a[0..]);
                const mb = zm.loadMat(b[0..]);
                const r = zm.mul(ma, mb);
                std.mem.doNotOptimizeAway(&r);
            }
        }
    }
    {
        i = 0;
        var timer = try Timer.start();
        const start = timer.lap();
        while (i < count) : (i += 1) {
            for (data1.items) |b| {
                for (data0.items) |a| {
                    const r = [16]f32{
                        a[0] * b[0] + a[1] * b[4] + a[2] * b[8] + a[3] * b[12],
                        a[0] * b[1] + a[1] * b[5] + a[2] * b[9] + a[3] * b[13],
                        a[0] * b[2] + a[1] * b[6] + a[2] * b[10] + a[3] * b[14],
                        a[0] * b[3] + a[1] * b[7] + a[2] * b[11] + a[3] * b[15],
                        a[4] * b[0] + a[5] * b[4] + a[6] * b[8] + a[7] * b[12],
                        a[4] * b[1] + a[5] * b[5] + a[6] * b[9] + a[7] * b[13],
                        a[4] * b[2] + a[5] * b[6] + a[6] * b[10] + a[7] * b[14],
                        a[4] * b[3] + a[5] * b[7] + a[6] * b[11] + a[7] * b[15],
                        a[8] * b[0] + a[9] * b[4] + a[10] * b[8] + a[11] * b[12],
                        a[8] * b[1] + a[9] * b[5] + a[10] * b[9] + a[11] * b[13],
                        a[8] * b[2] + a[9] * b[6] + a[10] * b[10] + a[11] * b[14],
                        a[8] * b[3] + a[9] * b[7] + a[10] * b[11] + a[11] * b[15],
                        a[12] * b[0] + a[13] * b[4] + a[14] * b[8] + a[15] * b[12],
                        a[12] * b[1] + a[13] * b[5] + a[14] * b[9] + a[15] * b[13],
                        a[12] * b[2] + a[13] * b[6] + a[14] * b[10] + a[15] * b[14],
                        a[12] * b[3] + a[13] * b[7] + a[14] * b[11] + a[15] * b[15],
                    };
                    std.mem.doNotOptimizeAway(&r);
                }
            }
        }
        const end = timer.read();
        const elapsed_s = @as(f64, @floatFromInt(end - start)) / time.ns_per_s;
        std.debug.print("scalar version: {d:.4}s, ", .{elapsed_s});
    }
    {
        i = 0;
        var timer = try Timer.start();
        const start = timer.lap();
        while (i < count) : (i += 1) {
            for (data1.items) |b| {
                for (data0.items) |a| {
                    const ma = zm.loadMat(a[0..]);
                    const mb = zm.loadMat(b[0..]);
                    const r = zm.mul(ma, mb);
                    std.mem.doNotOptimizeAway(&r);
                }
            }
        }
        const end = timer.read();
        const elapsed_s = @as(f64, @floatFromInt(end - start)) / time.ns_per_s;
        std.debug.print("zmath version: {d:.4}s\n", .{elapsed_s});
    }
 }
 noinline fn cross3ScaleBiasBenchmark(allocator: std.mem.Allocator, comptime count: comptime_int) !void {
    std.debug.print("{s:>42} - ", .{"cross3, scale, bias benchmark (AOS)"});
    var data0 = std.ArrayList([3]f32).init(allocator);
    defer data0.deinit();
    var data1 = std.ArrayList([3]f32).init(allocator);
    defer data1.deinit();
    var i: usize = 0;
    while (i < 256) : (i += 1) {
        try data0.append([3]f32{ random.float(f32), random.float(f32), random.float(f32) });
        try data1.append([3]f32{ random.float(f32), random.float(f32), random.float(f32) });
    }
    // Warmup, fills L1 cache.
    i = 0;
    while (i < 100) : (i += 1) {
        for (data1.items) |b| {
            for (data0.items) |a| {
                const va = zm.loadArr3(a);
                const vb = zm.loadArr3(b);
                const cp = zm.f32x4s(0.01) * zm.cross3(va, vb) + zm.f32x4s(1.0);
                std.mem.doNotOptimizeAway(&cp);
            }
        }
    }
    {
        i = 0;
        var timer = try Timer.start();
        const start = timer.lap();
        while (i < count) : (i += 1) {
            for (data1.items) |b| {
                for (data0.items) |a| {
                    const r = [3]f32{
                        0.01 * (a[1] * b[2] - a[2] * b[1]) + 1.0,
                        0.01 * (a[2] * b[0] - a[0] * b[2]) + 1.0,
                        0.01 * (a[0] * b[1] - a[1] * b[0]) + 1.0,
                    };
                    std.mem.doNotOptimizeAway(&r);
                }
            }
        }
        const end = timer.read();
        const elapsed_s = @as(f64, @floatFromInt(end - start)) / time.ns_per_s;
        std.debug.print("scalar version: {d:.4}s, ", .{elapsed_s});
    }
    {
        i = 0;
        var timer = try Timer.start();
        const start = timer.lap();
        while (i < count) : (i += 1) {
            for (data1.items) |b| {
                for (data0.items) |a| {
                    const va = zm.loadArr3(a);
                    const vb = zm.loadArr3(b);
                    const cp = zm.f32x4s(0.01) * zm.cross3(va, vb) + zm.f32x4s(1.0);
                    std.mem.doNotOptimizeAway(&cp);
                }
            }
        }
        const end = timer.read();
        const elapsed_s = @as(f64, @floatFromInt(end - start)) / time.ns_per_s;
        std.debug.print("zmath version: {d:.4}s\n", .{elapsed_s});
    }
 }
 noinline fn cross3Dot3ScaleBiasBenchmark(allocator: std.mem.Allocator, comptime count: comptime_int) !void {
    std.debug.print("{s:>42} - ", .{"cross3, dot3, scale, bias benchmark (AOS)"});
    var data0 = std.ArrayList([3]f32).init(allocator);
    defer data0.deinit();
    var data1 = std.ArrayList([3]f32).init(allocator);
    defer data1.deinit();
    var i: usize = 0;
    while (i < 256) : (i += 1) {
        try data0.append([3]f32{ random.float(f32), random.float(f32), random.float(f32) });
        try data1.append([3]f32{ random.float(f32), random.float(f32), random.float(f32) });
    }
    // Warmup, fills L1 cache.
    i = 0;
    while (i < 100) : (i += 1) {
        for (data1.items) |b| {
            for (data0.items) |a| {
                const va = zm.loadArr3(a);
                const vb = zm.loadArr3(b);
                const r = (zm.dot3(va, vb) * (zm.f32x4s(0.1) * zm.cross3(va, vb) + zm.f32x4s(1.0)))[0];
                std.mem.doNotOptimizeAway(&r);
            }
        }
    }
    {
        i = 0;
        var timer = try Timer.start();
        const start = timer.lap();
        while (i < count) : (i += 1) {
            for (data1.items) |b| {
                for (data0.items) |a| {
                    const d = a[0] * b[0] + a[1] * b[1] + a[2] * b[2];
                    const r = [3]f32{
                        d * (0.1 * (a[1] * b[2] - a[2] * b[1]) + 1.0),
                        d * (0.1 * (a[2] * b[0] - a[0] * b[2]) + 1.0),
                        d * (0.1 * (a[0] * b[1] - a[1] * b[0]) + 1.0),
                    };
                    std.mem.doNotOptimizeAway(&r);
                }
            }
        }
        const end = timer.read();
        const elapsed_s = @as(f64, @floatFromInt(end - start)) / time.ns_per_s;
        std.debug.print("scalar version: {d:.4}s, ", .{elapsed_s});
    }
    {
        i = 0;
        var timer = try Timer.start();
        const start = timer.lap();
        while (i < count) : (i += 1) {
            for (data1.items) |b| {
                for (data0.items) |a| {
                    const va = zm.loadArr3(a);
                    const vb = zm.loadArr3(b);
                    const r = zm.dot3(va, vb) * (zm.f32x4s(0.1) * zm.cross3(va, vb) + zm.f32x4s(1.0));
                    std.mem.doNotOptimizeAway(&r);
                }
            }
        }
        const end = timer.read();
        const elapsed_s = @as(f64, @floatFromInt(end - start)) / time.ns_per_s;
        std.debug.print("zmath version: {d:.4}s\n", .{elapsed_s});
    }
 }
 noinline fn quatBenchmark(allocator: std.mem.Allocator, comptime count: comptime_int) !void {
    std.debug.print("{s:>42} - ", .{"quaternion mul benchmark (AOS)"});
    var data0 = std.ArrayList([4]f32).init(allocator);
    defer data0.deinit();
    var data1 = std.ArrayList([4]f32).init(allocator);
    defer data1.deinit();
    var i: usize = 0;
    while (i < 256) : (i += 1) {
        try data0.append([4]f32{ random.float(f32), random.float(f32), random.float(f32), random.float(f32) });
        try data1.append([4]f32{ random.float(f32), random.float(f32), random.float(f32), random.float(f32) });
    }
    // Warmup, fills L1 cache.
    i = 0;
    while (i < 100) : (i += 1) {
        for (data1.items) |b| {
            for (data0.items) |a| {
                const va = zm.loadArr4(a);
                const vb = zm.loadArr4(b);
                const r = zm.qmul(va, vb);
                std.mem.doNotOptimizeAway(&r);
            }
        }
    }
    {
        i = 0;
        var timer = try Timer.start();
        const start = timer.lap();
        while (i < count) : (i += 1) {
            for (data1.items) |b| {
                for (data0.items) |a| {
                    const r = [4]f32{
                        (b[3] * a[0]) + (b[0] * a[3]) + (b[1] * a[2]) - (b[2] * a[1]),
                        (b[3] * a[1]) - (b[0] * a[2]) + (b[1] * a[3]) + (b[2] * a[0]),
                        (b[3] * a[2]) + (b[0] * a[1]) - (b[1] * a[0]) + (b[2] * a[3]),
                        (b[3] * a[3]) - (b[0] * a[0]) - (b[1] * a[1]) - (b[2] * a[2]),
                    };
                    std.mem.doNotOptimizeAway(&r);
                }
            }
        }
        const end = timer.read();
        const elapsed_s = @as(f64, @floatFromInt(end - start)) / time.ns_per_s;
        std.debug.print("scalar version: {d:.4}s, ", .{elapsed_s});
    }
    {
        i = 0;
        var timer = try Timer.start();
        const start = timer.lap();
        while (i < count) : (i += 1) {
            for (data1.items) |b| {
                for (data0.items) |a| {
                    const va = zm.loadArr4(a);
                    const vb = zm.loadArr4(b);
                    const r = zm.qmul(va, vb);
                    std.mem.doNotOptimizeAway(&r);
                }
            }
        }
        const end = timer.read();
        const elapsed_s = @as(f64, @floatFromInt(end - start)) / time.ns_per_s;
        std.debug.print("zmath version: {d:.4}s\n", .{elapsed_s});
    }
 }
 noinline fn waveBenchmark(allocator: std.mem.Allocator, comptime count: comptime_int) !void {
    _ = allocator;
    std.debug.print("{s:>42} - ", .{"wave benchmark (SOA)"});
    const grid_size = 1024;
    {
        var t: f32 = 0.0;
        const scale: f32 = 0.05;
        var timer = try Timer.start();
        const start = timer.lap();
        var iter: usize = 0;
        while (iter < count) : (iter += 1) {
            var z_index: i32 = 0;
            while (z_index < grid_size) : (z_index += 1) {
                const z = scale * @as(f32, @floatFromInt(z_index - grid_size / 2));
                var x_index: i32 = 0;
                while (x_index < grid_size) : (x_index += 4) {
                    const x0 = scale * @as(f32, @floatFromInt(x_index + 0 - grid_size / 2));
                    const x1 = scale * @as(f32, @floatFromInt(x_index + 1 - grid_size / 2));
                    const x2 = scale * @as(f32, @floatFromInt(x_index + 2 - grid_size / 2));
                    const x3 = scale * @as(f32, @floatFromInt(x_index + 3 - grid_size / 2));
                    const d0 = zm.sqrt(x0 * x0 + z * z);
                    const d1 = zm.sqrt(x1 * x1 + z * z);
                    const d2 = zm.sqrt(x2 * x2 + z * z);
                    const d3 = zm.sqrt(x3 * x3 + z * z);
                    const y0 = zm.sin(d0 - t);
                    const y1 = zm.sin(d1 - t);
                    const y2 = zm.sin(d2 - t);
                    const y3 = zm.sin(d3 - t);
                    std.mem.doNotOptimizeAway(&y0);
                    std.mem.doNotOptimizeAway(&y1);
                    std.mem.doNotOptimizeAway(&y2);
                    std.mem.doNotOptimizeAway(&y3);
                }
            }
            t += 0.001;
        }
        const end = timer.read();
        const elapsed_s = @as(f64, @floatFromInt(end - start)) / time.ns_per_s;
        std.debug.print("scalar version: {d:.4}s, ", .{elapsed_s});
    }
    {
        const T = zm.F32x16;
        const static = struct {
            const offsets = [16]f32{ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15 };
        };
        const voffset = zm.load(static.offsets[0..], T, 0);
        var vt = zm.splat(T, 0.0);
        const scale: f32 = 0.05;
        var timer = try Timer.start();
        const start = timer.lap();
        var iter: usize = 0;
        while (iter < count) : (iter += 1) {
            var z_index: i32 = 0;
            while (z_index < grid_size) : (z_index += 1) {
                const z = scale * @as(f32, @floatFromInt(z_index - grid_size / 2));
                const vz = zm.splat(T, z);
                var x_index: i32 = 0;
                while (x_index < grid_size) : (x_index += zm.veclen(T)) {
                    const x = scale * @as(f32, @floatFromInt(x_index - grid_size / 2));
                    const vx = zm.splat(T, x) + voffset * zm.splat(T, scale);
                    const d = zm.sqrt(vx * vx + vz * vz);
                    const vy = zm.sin(d - vt);
                    std.mem.doNotOptimizeAway(&vy);
                }
            }
            vt += zm.splat(T, 0.001);
        }
        const end = timer.read();
        const elapsed_s = @as(f64, @floatFromInt(end - start)) / time.ns_per_s;
        std.debug.print("zmath version: {d:.4}s\n", .{elapsed_s});
    }
 }
--- a/libs/zmath/src/main.zig
+++ b/libs/zmath/src/main.zig
@ -0,0 +1,16 @@
 //--------------------------------------------------------------------------------------------------
 //
 // SIMD math library for game developers
 // https://github.com/michal-z/zig-gamedev/tree/main/libs/zmath
 //
 // See zmath.zig for more details.
 // See util.zig for additional functionality.
 //
 //--------------------------------------------------------------------------------------------------
 pub usingnamespace @import("zmath.zig");
 pub const util = @import("util.zig");
 // ensure transitive closure of test coverage
 comptime {
    _ = util;
 }
--- a/libs/zmath/src/util.zig
+++ b/libs/zmath/src/util.zig
@ -0,0 +1,188 @@
 // ==============================================================================
 //
 // Collection of useful functions building on top of, and extending, core zmath.
 // https://github.com/michal-z/zig-gamedev/tree/main/libs/zmath
 //
 // ------------------------------------------------------------------------------
 // 1. Matrix functions
 // ------------------------------------------------------------------------------
 //
 // As an example, in a left handed Y-up system:
 //   getAxisX is equivalent to the right vector
 //   getAxisY is equivalent to the up vector
 //   getAxisZ is equivalent to the forward vector
 //
 // getTranslationVec(m: Mat) Vec
 // getAxisX(m: Mat) Vec
 // getAxisY(m: Mat) Vec
 // getAxisZ(m: Mat) Vec
 //
 // ==============================================================================
 const zm = @import("zmath.zig");
 const std = @import("std");
 const math = std.math;
 const expect = std.testing.expect;
 pub fn getTranslationVec(m: zm.Mat) zm.Vec {
    var translation = m[3];
    translation[3] = 0;
    return translation;
 }
 pub fn setTranslationVec(m: *zm.Mat, translation: zm.Vec) void {
    const w = m[3][3];
    m[3] = translation;
    m[3][3] = w;
 }
 pub fn getScaleVec(m: zm.Mat) zm.Vec {
    const scale_x = zm.length3(zm.f32x4(m[0][0], m[1][0], m[2][0], 0))[0];
    const scale_y = zm.length3(zm.f32x4(m[0][1], m[1][1], m[2][1], 0))[0];
    const scale_z = zm.length3(zm.f32x4(m[0][2], m[1][2], m[2][2], 0))[0];
    return zm.f32x4(scale_x, scale_y, scale_z, 0);
 }
 pub fn getRotationQuat(_m: zm.Mat) zm.Quat {
    // Ortho normalize given matrix.
    const c1 = zm.normalize3(zm.f32x4(_m[0][0], _m[1][0], _m[2][0], 0));
    const c2 = zm.normalize3(zm.f32x4(_m[0][1], _m[1][1], _m[2][1], 0));
    const c3 = zm.normalize3(zm.f32x4(_m[0][2], _m[1][2], _m[2][2], 0));
    var m = _m;
    m[0][0] = c1[0];
    m[1][0] = c1[1];
    m[2][0] = c1[2];
    m[0][1] = c2[0];
    m[1][1] = c2[1];
    m[2][1] = c2[2];
    m[0][2] = c3[0];
    m[1][2] = c3[1];
    m[2][2] = c3[2];
    // Extract rotation
    return zm.quatFromMat(m);
 }
 pub fn getAxisX(m: zm.Mat) zm.Vec {
    return zm.normalize3(zm.f32x4(m[0][0], m[0][1], m[0][2], 0.0));
 }
 pub fn getAxisY(m: zm.Mat) zm.Vec {
    return zm.normalize3(zm.f32x4(m[1][0], m[1][1], m[1][2], 0.0));
 }
 pub fn getAxisZ(m: zm.Mat) zm.Vec {
    return zm.normalize3(zm.f32x4(m[2][0], m[2][1], m[2][2], 0.0));
 }
 test "zmath.util.mat.translation" {
    // zig fmt: off
    const mat_data = [18]f32{
        1.0,
        2.0, 3.0, 4.0, 5.0,
        6.0, 7.0, 8.0, 9.0,
        10.0,11.0, 12.0,13.0,
        14.0, 15.0, 16.0, 17.0,
        18.0,
    };
    // zig fmt: on
    const mat = zm.loadMat(mat_data[1..]);
    const translation = getTranslationVec(mat);
    try zm.expectVecApproxEqAbs(translation, zm.f32x4(14.0, 15.0, 16.0, 0.0), 0.0001);
 }
 test "zmath.util.mat.scale" {
    const mat = zm.mul(zm.scaling(3, 4, 5), zm.translation(6, 7, 8));
    const scale = getScaleVec(mat);
    try zm.expectVecApproxEqAbs(scale, zm.f32x4(3.0, 4.0, 5.0, 0.0), 0.0001);
 }
 test "zmath.util.mat.rotation" {
    const rotate_origin = zm.matFromRollPitchYaw(0.1, 1.2, 2.3);
    const mat = zm.mul(zm.mul(rotate_origin, zm.scaling(3, 4, 5)), zm.translation(6, 7, 8));
    const rotate_get = getRotationQuat(mat);
    const v0 = zm.mul(zm.f32x4s(1), rotate_origin);
    const v1 = zm.mul(zm.f32x4s(1), zm.quatToMat(rotate_get));
    try zm.expectVecApproxEqAbs(v0, v1, 0.0001);
 }
 test "zmath.util.mat.z_vec" {
    const degToRad = std.math.degreesToRadians;
    var identity = zm.identity();
    var z_vec = getAxisZ(identity);
    try zm.expectVecApproxEqAbs(z_vec, zm.f32x4(0.0, 0.0, 1.0, 0), 0.0001);
    const rot_yaw = zm.rotationY(degToRad(90));
    identity = zm.mul(identity, rot_yaw);
    z_vec = getAxisZ(identity);
    try zm.expectVecApproxEqAbs(z_vec, zm.f32x4(1.0, 0.0, 0.0, 0), 0.0001);
 }
 test "zmath.util.mat.y_vec" {
    const degToRad = std.math.degreesToRadians;
    var identity = zm.identity();
    var y_vec = getAxisY(identity);
    try zm.expectVecApproxEqAbs(y_vec, zm.f32x4(0.0, 1.0, 0.0, 0), 0.01);
    const rot_yaw = zm.rotationY(degToRad(90));
    identity = zm.mul(identity, rot_yaw);
    y_vec = getAxisY(identity);
    try zm.expectVecApproxEqAbs(y_vec, zm.f32x4(0.0, 1.0, 0.0, 0), 0.01);
    const rot_pitch = zm.rotationX(degToRad(90));
    identity = zm.mul(identity, rot_pitch);
    y_vec = getAxisY(identity);
    try zm.expectVecApproxEqAbs(y_vec, zm.f32x4(0.0, 0.0, 1.0, 0), 0.01);
 }
 test "zmath.util.mat.right" {
    const degToRad = std.math.degreesToRadians;
    var identity = zm.identity();
    var right = getAxisX(identity);
    try zm.expectVecApproxEqAbs(right, zm.f32x4(1.0, 0.0, 0.0, 0), 0.01);
    const rot_yaw = zm.rotationY(degToRad(90));
    identity = zm.mul(identity, rot_yaw);
    right = getAxisX(identity);
    try zm.expectVecApproxEqAbs(right, zm.f32x4(0.0, 0.0, -1.0, 0), 0.01);
    const rot_pitch = zm.rotationX(degToRad(90));
    identity = zm.mul(identity, rot_pitch);
    right = getAxisX(identity);
    try zm.expectVecApproxEqAbs(right, zm.f32x4(0.0, 1.0, 0.0, 0), 0.01);
 }
 // ------------------------------------------------------------------------------
 // This software is available under 2 licenses -- choose whichever you prefer.
 // ------------------------------------------------------------------------------
 // ALTERNATIVE A - MIT License
 // Copyright (c) 2022 Michal Ziulek and Contributors
 // Permission is hereby granted, free of charge, to any person obtaining identity copy of
 // this software and associated documentation files (the "Software"), to deal in
 // the Software without restriction, including without limitation the rights to
 // use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
 // of the Software, and to permit persons to whom the Software is furnished to do
 // so, subject to the following conditions:
 // The above copyright notice and this permission notice shall be included in all
 // copies or substantial portions of the Software.
 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 // SOFTWARE.
 // ------------------------------------------------------------------------------
 // ALTERNATIVE B - Public Domain (www.unlicense.org)
 // This is free and unencumbered software released into the public domain.
 // Anyone is free to copy, modify, publish, use, compile, sell, or distribute this
 // software, either in source code form or as identity compiled binary, for any purpose,
 // commercial or non-commercial, and by any means.
 // In jurisdictions that recognize copyright laws, the author or authors of this
 // software dedicate any and all copyright interest in the software to the public
 // domain. We make this dedication for the benefit of the public at large and to
 // the detriment of our heirs and successors. We intend this dedication to be an
 // overt act of relinquishment in perpetuity of all present and future rights to
 // this software under copyright law.
 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 // AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 // ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
 // WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 // ------------------------------------------------------------------------------
--- a/libs/zmath/src/zmath.zig
+++ b/libs/zmath/src/zmath.zig
--- a/src/main.zig
+++ b/src/main.zig
@ -1,7 +1,10 @@
 const std = @import("std");
 const vk = @import("vulkan");
 const sdl = @import("sdl2");
 const zm = @import("zmath");
 const VulkanRenderer = @import("vulkan_renderer.zig").VulkanRenderer;
 const Vector3 = @import("utilities.zig").Vector3;
 pub fn main() !void {
    const window = try initWindow();
@ -16,6 +19,11 @@ pub fn main() !void {
    var vulkan_renderer = try VulkanRenderer.init(window, allocator);
    defer vulkan_renderer.deinit();
    var angle: f32 = 0.0;
    var now: u64 = sdl.getPerformanceCounter();
    var last: u64 = 0;
    var delta_time: f32 = 0.0;
    mainLoop: while (true) {
        while (sdl.pollEvent()) |ev| {
            switch (ev) {
@ -29,6 +37,18 @@ pub fn main() !void {
            }
        }
        last = now;
        now = sdl.getPerformanceCounter();
        delta_time = @as(f32, @floatFromInt(now - last)) * 1000.0 / @as(f32, @floatFromInt(now));
        angle += 10.0 * delta_time;
        if (angle > 360.0) {
            angle -= 360.0;
        }
        try vulkan_renderer.updateModel(zm.rotationZ(angle));
        try vulkan_renderer.draw();
    }
 }
--- a/src/shaders/shader.vert
+++ b/src/shaders/shader.vert
@ -3,9 +3,15 @@
 layout(location = 0) in vec3 pos;
 layout(location = 1) in vec3 col;
 layout(binding = 0) uniform MVP {
    mat4 projection;
    mat4 view;
    mat4 model;
 } mvp;
 layout(location = 0) out vec3 fragCol;
 void main() {
-    gl_Position = vec4(pos, 1.0);
+    gl_Position = mvp.projection * mvp.view * mvp.model * vec4(pos, 1.0);
    fragCol = col;
 }
--- a/src/vulkan_renderer.zig
+++ b/src/vulkan_renderer.zig
@ -3,6 +3,7 @@ const sdl = @import("sdl2");
 const vk = @import("vulkan");
 const builtin = @import("builtin");
 const shaders = @import("shaders");
 const zm = @import("zmath");
 const Utilities = @import("utilities.zig");
 const QueueFamilyIndices = Utilities.QueueFamilyIndices;
@ -39,6 +40,12 @@ pub const CommandBuffer = vk.CommandBufferProxy(apis);
 pub const VulkanRenderer = struct {
    const Self = @This();
    const Mvp = struct {
        projection: zm.Mat,
        view: zm.Mat,
        model: zm.Mat,
    };
    allocator: std.mem.Allocator,
    vkb: BaseDispatch,
@ -50,6 +57,9 @@ pub const VulkanRenderer = struct {
    // Scene objects
    meshes: [2]Mesh,
    // Scene settings
    mvp: Mvp,
    // Main
    instance: Instance,
    physical_device: vk.PhysicalDevice,
@ -65,6 +75,15 @@ pub const VulkanRenderer = struct {
    swapchain_framebuffers: []vk.Framebuffer,
    command_buffers: []CommandBuffer,
    // Descriptors
    descriptor_set_layout: vk.DescriptorSetLayout,
    descriptor_pool: vk.DescriptorPool,
    descriptor_sets: []vk.DescriptorSet,
    uniform_buffer: []vk.Buffer,
    uniform_buffer_memory: []vk.DeviceMemory,
    // Pipeline
    graphics_pipeline: vk.Pipeline,
    pipeline_layout: vk.PipelineLayout,
@ -103,10 +122,28 @@ pub const VulkanRenderer = struct {
        try self.createLogicalDevice();
        try self.createSwapchain();
        try self.createRenderPass();
        try self.createDescriptorSetLayout();
        try self.createGraphicsPipeline();
        try self.createFramebuffers();
        try self.createCommandPool();
        const aspect: f32 = @as(f32, @floatFromInt(self.extent.width)) / @as(f32, @floatFromInt(self.extent.height));
        self.mvp.projection = zm.perspectiveFovRh(
            std.math.degreesToRadians(45.0),
            aspect,
            0.1,
            100.0,
        );
        self.mvp.view = zm.lookAtRh(
            zm.Vec{ 0.0, 0.0, 2.0, 0.0 },
            zm.Vec{ 0.0, 0.0, 0.0, 0.0 },
            zm.Vec{ 0.0, 1.0, 0.0, 0.0 },
        );
        self.mvp.model = zm.identity();
        // Invert y scale
        self.mvp.projection[1][1] *= -1;
        // Create meshes
        // Vertex Data
        var mesh_vertices = [_]Vertex{
@ -154,12 +191,21 @@ pub const VulkanRenderer = struct {
        self.meshes = [_]Mesh{ first_mesh, second_mesh };
        try self.createCommandBuffers();
        try self.createUniformBuffers();
        try self.createDescriptorPool();
        try self.createDescriptorSets();
        try self.recordCommands();
        try self.createSynchronisation();
        return self;
    }
    pub fn updateModel(self: *Self, new_model: zm.Mat) !void {
        self.mvp.model = new_model;
    }
    pub fn draw(self: *Self) !void {
        // Wait for given fence to signal (open) from last draw before continuing
        _ = try self.device.waitForFences(1, @ptrCast(&self.draw_fences[self.current_frame]), vk.TRUE, std.math.maxInt(u64));
@ -175,6 +221,8 @@ pub const VulkanRenderer = struct {
            .null_handle,
        );
        try self.updateUniformBuffer(image_index_result.image_index);
        // -- Submit command buffer to render
        // Queue submission information
        const wait_stages = [_]vk.PipelineStageFlags{.{ .color_attachment_output_bit = true }};
@ -215,6 +263,17 @@ pub const VulkanRenderer = struct {
            self.instance.destroyDebugUtilsMessengerEXT(self.debug_utils.?, null);
        }
        self.device.destroyDescriptorPool(self.descriptor_pool, null);
        self.device.destroyDescriptorSetLayout(self.descriptor_set_layout, null);
        for (self.uniform_buffer, self.uniform_buffer_memory) |buffer, buffer_memory| {
            self.device.destroyBuffer(buffer, null);
            self.device.freeMemory(buffer_memory, null);
        }
        self.allocator.free(self.uniform_buffer);
        self.allocator.free(self.uniform_buffer_memory);
        self.allocator.free(self.descriptor_sets);
        for (self.meshes) |mesh| {
            mesh.destroyBuffers();
        }
@ -491,6 +550,26 @@ pub const VulkanRenderer = struct {
        self.render_pass = try self.device.createRenderPass(&render_pass_create_info, null);
    }
    fn createDescriptorSetLayout(self: *Self) !void {
        // MVP binding info
        const mvp_layout_binding: vk.DescriptorSetLayoutBinding = .{
            .binding = 0, // Binding point in shader (designated by binding number in shader)
            .descriptor_type = .uniform_buffer, // Type of descriptor (unifor, dynamic uniform, image sampler, etc)
            .descriptor_count = 1, // Number of descriptors for binding
            .stage_flags = .{ .vertex_bit = true }, // Shader stage to bind to
            .p_immutable_samplers = null, // For texture: can make smapler data immutable by specifying in layout
        };
        // Create descriptor set layout with given bindings
        const layout_create_info: vk.DescriptorSetLayoutCreateInfo = .{
            .binding_count = 1, // Number of binding infos
            .p_bindings = @ptrCast(&mvp_layout_binding), // Array of binding infos
        };
        // Create descriptor set layout
        self.descriptor_set_layout = try self.device.createDescriptorSetLayout(&layout_create_info, null);
    }
    fn createGraphicsPipeline(self: *Self) !void {
        // Create shader modules
        const vert = try self.device.createShaderModule(&.{
@ -606,7 +685,7 @@ pub const VulkanRenderer = struct {
            .polygon_mode = .fill, // How to handle filling points between vertices
            .line_width = 1.0, // How thick the lines should be when drawn
            .cull_mode = .{ .back_bit = true }, // Which face of a triangle to cull
-            .front_face = .clockwise, // Winding to determine which side is front
+            .front_face = .counter_clockwise, // Winding to determine which side is front
            .depth_bias_enable = vk.FALSE, // Whether to add depth bias to fragments (good for stopping "shadow acne" in shadow mapping)
            .depth_bias_constant_factor = 0,
            .depth_bias_clamp = 0,
@ -647,8 +726,11 @@ pub const VulkanRenderer = struct {
            .blend_constants = [_]f32{ 0, 0, 0, 0 },
        };
-        // -- Pipeline layout (TODO: Apply future descriptor set layouts) --
+        // -- Pipeline layout --
-        const pipeline_layout_create_info: vk.PipelineLayoutCreateInfo = .{};
+        const pipeline_layout_create_info: vk.PipelineLayoutCreateInfo = .{
            .set_layout_count = 1,
            .p_set_layouts = @ptrCast(&self.descriptor_set_layout),
        };
        self.pipeline_layout = try self.device.createPipelineLayout(&pipeline_layout_create_info, null);
@ -748,6 +830,101 @@ pub const VulkanRenderer = struct {
        }
    }
    fn createUniformBuffers(self: *Self) !void {
        // Buffer size will be size of all three variables (will offset to access)
        const buffer_size: vk.DeviceSize = @sizeOf(@TypeOf(self.mvp));
        // One uniform buffer for each image (and by extension, command buffer)
        self.uniform_buffer = try self.allocator.alloc(vk.Buffer, self.swapchain_images.len);
        self.uniform_buffer_memory = try self.allocator.alloc(vk.DeviceMemory, self.swapchain_images.len);
        // Create the uniform buffers
        for (0..self.uniform_buffer.len) |i| {
            try Utilities.createBuffer(
                self.physical_device,
                self.instance,
                self.device,
                buffer_size,
                .{ .uniform_buffer_bit = true },
                .{ .host_visible_bit = true, .host_coherent_bit = true },
                &self.uniform_buffer[i],
                &self.uniform_buffer_memory[i],
            );
        }
    }
    fn createDescriptorPool(self: *Self) !void {
        // Type of descriptors + how many descriptors (!= descriptor sets) (combined makes the pool size)
        const pool_size: vk.DescriptorPoolSize = .{
            .type = .uniform_buffer,
            .descriptor_count = @intCast(self.uniform_buffer.len),
        };
        // Data to create descriptor pool
        const pool_create_info: vk.DescriptorPoolCreateInfo = .{
            .max_sets = @intCast(self.uniform_buffer.len), // Maximum number of descriptor sets that can be created from pool
            .pool_size_count = 1, // Amount of pool sizes being passed
            .p_pool_sizes = @ptrCast(&pool_size), // Pool sizes to create pool with
        };
        // Create descriptor pool
        self.descriptor_pool = try self.device.createDescriptorPool(&pool_create_info, null);
    }
    fn createDescriptorSets(self: *Self) !void {
        // One descriptor set for every buffer
        self.descriptor_sets = try self.allocator.alloc(vk.DescriptorSet, self.uniform_buffer.len);
        var set_layouts = try self.allocator.alloc(vk.DescriptorSetLayout, self.uniform_buffer.len);
        defer self.allocator.free(set_layouts);
        for (0..set_layouts.len) |i| {
            set_layouts[i] = self.descriptor_set_layout;
        }
        // Descriptor set allocation info
        const set_alloc_info: vk.DescriptorSetAllocateInfo = .{
            .descriptor_pool = self.descriptor_pool, // Pool to allocate descriptor set from
            .descriptor_set_count = @intCast(self.descriptor_sets.len), // Number of sets to allocate
            .p_set_layouts = set_layouts.ptr, // Layouts to use to allocate sets (1:1 relationship)
        };
        // Allocate descriptor sets (multiple)
        try self.device.allocateDescriptorSets(&set_alloc_info, self.descriptor_sets.ptr);
        // Update all of descriptor set buffer bindings
        for (0..self.descriptor_sets.len) |i| {
            // Buffer info and data offset info
            const mvp_buffer_info: vk.DescriptorBufferInfo = .{
                .buffer = self.uniform_buffer[i], // Bufer to get data from
                .offset = 0, // Position of start of data
                .range = @sizeOf(@TypeOf(self.mvp)), // Size of data
            };
            // Data about connection between binding and buffer
            const mvp_set_write: vk.WriteDescriptorSet = .{
                .dst_set = self.descriptor_sets[i], // Descriptor set to update
                .dst_binding = 0, // Binding to update (matches with binding on layout/shader)
                .dst_array_element = 0, // Index in array to update
                .descriptor_type = .uniform_buffer, // Type of descriptor
                .descriptor_count = 1, // Amount to update
                .p_buffer_info = @ptrCast(&mvp_buffer_info), // Information about buffer data to bind
                .p_image_info = undefined,
                .p_texel_buffer_view = undefined,
            };
            // Update the descriptor sets with new buffer/binding info
            self.device.updateDescriptorSets(1, @ptrCast(&mvp_set_write), 0, null);
        }
    }
    fn updateUniformBuffer(self: Self, image_index: u32) !void {
        const data = try self.device.mapMemory(self.uniform_buffer_memory[image_index], 0, @sizeOf(Mvp), .{});
        const mvp_data: *Mvp = @ptrCast(@alignCast(data));
        mvp_data.* = self.mvp;
        self.device.unmapMemory(self.uniform_buffer_memory[image_index]);
    }
    fn recordCommands(self: *Self) !void {
        // Information about how to begin each command
        const buffer_begin_info: vk.CommandBufferBeginInfo = .{
@ -799,6 +976,17 @@ pub const VulkanRenderer = struct {
                    // Bind mesh index buffer, with 0 offset and using the uint32 type
                    command_buffer.bindIndexBuffer(mesh.index_buffer, 0, .uint32);
                    // Bind descriptor sets
                    command_buffer.bindDescriptorSets(
                        .graphics,
                        self.pipeline_layout,
                        0,
                        1,
                        @ptrCast(&self.descriptor_sets[i]),
                        0,
                        null,
                    );
                    // Execute a pipeline
                    command_buffer.drawIndexed(mesh.index_count, 1, 0, 0, 0);
                }