summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--c2.cpp32
-rw-r--r--convmodel.c3
-rw-r--r--intermediate/surface.glsl51
-rw-r--r--model.cpp28
-rw-r--r--model.hpp2
-rw-r--r--pipeline.cpp13
-rw-r--r--sc/sc.cpp219
-rw-r--r--video.cpp173
-rw-r--r--video.hpp8
9 files changed, 400 insertions, 129 deletions
diff --git a/c2.cpp b/c2.cpp
index 58e33ff..1f55c15 100644
--- a/c2.cpp
+++ b/c2.cpp
@@ -60,33 +60,6 @@ static Buffer_Id upload_verts(Device* dev) {
return vbo;
}
-Texture_Id make_default_texture(Device* dev) {
- unsigned* mem;
- Texture_Id tex;
- Buffer_Id buf = dev->create_buffer(
- "default texture stage",
- 4,
- Buffer_Flags::copy_src |
- Buffer_Flags::cpu_readwrite
- );
- mem = (unsigned*)dev->map_buffer(buf, 0, 4);
- mem[0] = 0xffffffff;
- dev->unmap_buffer(buf);
- tex = dev->create_texture(
- "default PBR texture",
- texture_format_rgba8i,
- Texture_Flags::sampleable | Texture_Flags::copy_dst,
- 1,
- 1,
- 1,
- 1,
- 1,
- buf
- );
- dev->destroy_bufferi(buf);
- return tex;
-}
-
static Sampler_Id create_clamped_linear(Device* dev) {
Sampler_State s{};
s.min = Filter_Mode::linear;
@@ -642,7 +615,6 @@ struct C2 : public App {
Collider* box_col, * floor_col;
Texture* texture;
Texture* texture2;
- Texture_Id default_texture;
Entity_Id monkey, monkey2, box, floor;
Model_Scene scene;
Renderer renderer;
@@ -694,11 +666,10 @@ struct C2 : public App {
);
assets.init(&asset_arena, "pack", 128);
dev = Device::create(&video_arena, this);
- default_texture = make_default_texture(dev);
make_hdr_target();
make_ui_texture();
model_loader.init(dev, &assets);
- mat_loader.init(&assets, default_texture);
+ mat_loader.init(&assets);
register_asset_loader("MODL", &model_loader);
register_asset_loader("MTRL", &mat_loader);
shader = (Shader*)assets.load("triangle.csh");
@@ -1035,7 +1006,6 @@ struct C2 : public App {
ui->destroy();
deinit_editor();
assets.destroy();
- dev->destroy_texture(default_texture);
dev->destroy_texture(hdr_target);
dev->destroy_texture(hdr_resolved);
dev->destroy_texture(ms_depth);
diff --git a/convmodel.c b/convmodel.c
index 31a062d..89f65c8 100644
--- a/convmodel.c
+++ b/convmodel.c
@@ -332,7 +332,7 @@ Shader_Attrib* parse_shader_attribs(const char* fname) {
FILE* f;
char magic[4];
int type, i;
- int binding_count, target_count, desc_count;
+ int binding_count, target_count, desc_count, opt_count;
char* fpath = arena_alloc(
&arena,
string_len(fname) +
@@ -362,6 +362,7 @@ Shader_Attrib* parse_shader_attribs(const char* fname) {
fread(&binding_count, 4, 1, f);
fread(&target_count, 4, 1, f);
fread(&desc_count, 4, 1, f);
+ fread(&opt_count, 4, 1, f);
assert(binding_count);
for (i = 0; i < binding_count; i++) {
char name[24];
diff --git a/intermediate/surface.glsl b/intermediate/surface.glsl
index ce80259..cc287e4 100644
--- a/intermediate/surface.glsl
+++ b/intermediate/surface.glsl
@@ -9,6 +9,22 @@ fragment: main
#ifdef DESC
+[option]
+name: albedomap
+stage: fragment
+[option]
+name: aomap
+stage: fragment
+[option]
+name: metalmap
+stage: fragment
+[option]
+name: roughmap
+stage: fragment
+[option]
+name: normalmap
+stage: fragment
+
[binding]
name: mesh
rate: vertex
@@ -142,8 +158,8 @@ void main() {
#define pi 3.14159265358979323846
-vec3 diffuse_brdf(vec2 uv) {
- vec3 a = material.albedo * texture(albedo, uv).rgb;
+vec3 diffuse_brdf(vec2 uv, vec3 base) {
+ vec3 a = base;
return a / pi;
}
@@ -157,7 +173,11 @@ float specular_G1(float a, vec3 v, vec3 n) {
float specular_brdf(vec2 uv, vec3 ref, vec3 l, vec3 v, vec3 n) {
float ndl = max(dot(n, l), 0.0);
float ndv = max(dot(n, v), 0.0);
+#if OPT_roughmap
float a = texture(rough, uv).r * material.roughness;
+#else
+ float a = material.roughness;
+#endif
float a2 = a * a;
float ndr = max(dot(n, ref), 0.0);
float b = ((ndr * ndr) * (a2 - 1) + 1);
@@ -244,26 +264,41 @@ void main() {
vec2 uv = interpolator.uv;
vec3 p = interpolator.position.xyz;
+#if OPT_normalmap
vec3 nrmsample = texture(normal, uv).rgb;
vec2 nrmxy = nrmsample.xy * 2.0 - 1.0;
vec3 nrm = normalize(vec3(nrmxy, 1.0));
- if (nrmsample.b == 1.0) /* default texture */
- nrm = normalize(interpolator.tbn[2]);
- else
- nrm = normalize(interpolator.tbn * nrm);
+ nrm = normalize(interpolator.tbn * nrm);
+#else
+ vec3 nrm = normalize(interpolator.tbn[2]);
+#endif
+#if OPT_albedomap
vec3 col = texture(albedo, uv).rgb * material.albedo;
- vec3 view_dir = normalize(globals.camera_pos - p);
+#else
+ vec3 col = material.albedo;
+#endif
+
+#if OPT_metalmap
float met = texture(metal, uv).r * material.metalness;
+#else
+ float met = material.metalness;
+#endif
+
+ vec3 view_dir = normalize(globals.camera_pos - p);
vec3 ref = reflect(-view_dir, nrm);
vec3 ref_col = texture(env_cube, ref, material.roughness * 8.0).rgb;
vec3 spec_col = mix(ref_col, ref_col * col, met);
vec3 amb_col = min(textureLod(env_cube, nrm, 8.0).rgb, 0.05);
+#if OPT_aomap
vec3 ambient =
amb_col *
texture(ao, uv).r * material.ao;
+#else
+ vec3 ambient = amb_col * material.ao;
+#endif
- vec3 base_diffuse = diffuse_brdf(uv) * (1.0 - met);
+ vec3 base_diffuse = diffuse_brdf(uv, col) * (1.0 - met);
vec3 light = 0.0.xxx;
e = globals.sun_irange.y;
diff --git a/model.cpp b/model.cpp
index 6aba19e..ed6e968 100644
--- a/model.cpp
+++ b/model.cpp
@@ -32,20 +32,26 @@ void Material::use(
Sampler_Id sampler,
Shader& shader
) {
- auto bind = [&shader, &pb, sampler](
+ int opt = 0;
+ auto bind = [&shader, &pb, &opt, sampler](
const char* name,
+ const char* optname,
Texture_Id t
) {
int loc = shader.descriptor_binding(name);
if (loc >= 0) {
- pb.texture(loc, t, sampler);
+ if (t) {
+ pb.texture(loc, t, sampler);
+ opt |= shader.opt_mask(shader_type_fragment, optname);
+ }
}
};
- bind("albedo", tex.albedo);
- bind("ao", tex.ao);
- bind("metal", tex.metal);
- bind("rough", tex.rough);
- bind("normal", tex.normal);
+ bind("albedo", "albedomap", tex.albedo);
+ bind("ao", "aomap", tex.ao);
+ bind("metal", "metalmap", tex.metal);
+ bind("rough", "roughmap", tex.rough);
+ bind("normal", "normalmap", tex.normal);
+ pb.option(shader_type_fragment, opt);
}
void Model_Loader::init(Device* device, Asset_Arena* shader_arena) {
@@ -214,10 +220,8 @@ void Model::update_transforms() {
}
void Material_Loader::init(
- Asset_Arena* texture_arena,
- Texture_Id dt
+ Asset_Arena* texture_arena
) {
- default_tex = dt;
textures = texture_arena;
}
@@ -235,11 +239,11 @@ Asset* Material_Loader::load(
return r;
};
auto read_tex = [&](int len) {
- if (!len) return default_tex;
+ if (!len) return Texture_Id(0);
const char* name = read_name(len);
auto t = (Texture*)textures->load(name);
if (!t)
- return default_tex;
+ return Texture_Id(0);
return t->id;
};
(void)filename;
diff --git a/model.hpp b/model.hpp
index 75e310e..3ededa7 100644
--- a/model.hpp
+++ b/model.hpp
@@ -85,7 +85,7 @@ struct Model_Loader : public Asset_Loader {
struct Material_Loader : public Asset_Loader {
Asset_Arena* textures;
Texture_Id default_tex;
- void init(Asset_Arena* texture_arena, Texture_Id dt);
+ void init(Asset_Arena* texture_arena);
Asset* load(
Arena* a,
Arena* s,
diff --git a/pipeline.cpp b/pipeline.cpp
index 374dad8..4d34ebd 100644
--- a/pipeline.cpp
+++ b/pipeline.cpp
@@ -254,6 +254,14 @@ Pipeline_Builder& Pipeline_Builder::shader(Shader_Id s) {
return *this;
}
+Pipeline_Builder& Pipeline_Builder::option(
+ Shader_Type type,
+ int mask
+) {
+ pip->shader_masks[type] = mask;
+ return *this;
+}
+
Pipeline_Builder& Pipeline_Builder::texture(
int binding,
Texture_Id t,
@@ -321,6 +329,7 @@ Pipeline& Pipeline_Builder::build() {
}
void Pipeline::hash() {
+ int i;
#define h(n, v) \
n = fnv1a64_2(n, (uint8_t*)&v, sizeof v)
pipeline_hash = fnv1a64(0, 0);
@@ -347,8 +356,10 @@ void Pipeline::hash() {
h(pipeline_hash, blend_src_alpha);
h(pipeline_hash, blend_dst_alpha);
h(pipeline_hash, cull_mode);
+ for (i = 0; i < shader_type_count; i++)
+ h(pipeline_hash, shader_masks[i]);
{
- int i, e = descriptor_count;
+ int e = descriptor_count;
descriptor_resource_hash = fnv1a64(0, 0);
for (i = 0; i < e; i++) {
Descriptor* d = &descriptors[i];
diff --git a/sc/sc.cpp b/sc/sc.cpp
index f0ce0ff..69a7377 100644
--- a/sc/sc.cpp
+++ b/sc/sc.cpp
@@ -225,6 +225,10 @@ struct Desc {
int stage;
std::string strct;
};
+ struct Option {
+ int stage;
+ int mask;
+ };
int type;
std::vector<Binding> bindings;
std::vector<Variable> trgts;
@@ -233,8 +237,10 @@ struct Desc {
std::unordered_map<std::string, Texture> textures;
std::unordered_map<std::string, CBuffer> cbuffers;
std::unordered_map<std::string, SBuffer> sbuffers;
+ std::unordered_map<std::string, Option> options;
std::vector<Descriptor> descriptors;
std::string entrypoints[shader_type_count];
+ int copts[shader_type_count];
void read_var(Variable& d, cfg_Object* desc) {
const char* sname = find_string_default(desc, "name", 0);
if (!sname) {
@@ -397,10 +403,40 @@ struct Desc {
buf.stage |= 1 << stage_from_string(sstage);
}
+ void read_opt(cfg_Object* desc) {
+ const char* sname = find_string_default(desc, "name", 0);
+ if (!sname) {
+ print_err("%s must have a name.\n", desc->name);
+ pbreak(1001);
+ }
+ const char* sstage = find_string_default(desc, "stage", 0);
+ if (!sstage) {
+ print_err("%s must define a stage.\n", sname);
+ pbreak(1002);
+ }
+ std::string n(sname);
+ if (n.size() > 23) {
+ print_err("Option name %s is too long (max 23 chars).\n", sname);
+ pbreak(1003);
+ }
+ if (!options.contains(n)) {
+ Option& o = options[n];
+ o.mask = 0;
+ o.stage = 0;
+ }
+ int stage = stage_from_string(sstage);
+ Option& opt = options[n];
+ opt.stage |= 1 << stage;
+ opt.mask = copts[stage];
+ copts[stage] <<= 1;
+ }
+
void build(cfg_Object* desc) {
int i;
Binding* cur_binding = 0;
type = get_program_type(desc);
+ for (i = 0; i < shader_type_count; i++)
+ copts[i] = 1;
if (type != sprogram_type_graphics) {
assert(0); /* todo */
return;
@@ -450,6 +486,8 @@ struct Desc {
} else if (!strcmp(desc->name, "struct")) {
desc = read_struct(desc);
continue;
+ } else if (!strcmp(desc->name, "option")) {
+ read_opt(desc);
}
desc = desc->next;
}
@@ -628,22 +666,35 @@ std::vector<uint32_t> compile_shader(
const char* src,
const char* define,
int stage,
+ int opt,
EShLanguage lang
) {
std::string vars = d.build_vs();
- const char* srcs[] = {
+ std::vector<const char*> srcs = {
glsl_version_s, "\n",
"#define ", define, "\n",
builtin_src,
- presrc,
- src
+ presrc
};
- const char* src_names[] = {
+ std::vector<const char*> src_names = {
sname, sname,
sname, sname, sname,
- sname, sname, sname
+ sname, sname
};
- static_assert(sizeof srcs == sizeof src_names);
+ for (const auto& p : d.options) {
+ const auto& o = p.second;
+ std::string def = "#define OPT_" + p.first + " ";
+ if (opt & o.mask)
+ def += "1\n";
+ else
+ def += "0\n";
+ /* memory leak lol */
+ srcs.push_back(strdup(def.c_str()));
+ src_names.push_back(sname);
+ }
+ srcs.push_back(src);
+ src_names.push_back(sname);
+ assert(src_names.size() == srcs.size());
glslang::TShader shader(lang);
glslang::TProgram program;
glslang::TIntermediate* ir;
@@ -663,10 +714,10 @@ std::vector<uint32_t> compile_shader(
#endif
EShMessages msg = (EShMessages)(EShMsgSpvRules | EShMsgVulkanRules);
shader.setStringsWithLengthsAndNames(
- srcs,
+ &srcs[0],
0,
- src_names,
- sizeof srcs / sizeof *srcs
+ &src_names[0],
+ src_names.size()
);
shader.setEnvClient(glslang::EShClientVulkan, client_version);
shader.setEnvTarget(glslang::EShTargetSpv, target_version);
@@ -736,10 +787,23 @@ void configure(
}
}
+struct H_Variant {
+ int o = -1, s;
+ int mask;
+ int pad = 0;
+};
+struct H_Option {
+ char name[24] = { 0 };
+ int mask;
+ int stage;
+};
+static_assert(sizeof(H_Variant) == 16);
+using Variant_Map = std::unordered_map<int, std::vector<uint32_t>>;
+
void compile_shaders(
const char* sname,
const char* fname,
- std::vector<uint32_t>* spv,
+ Variant_Map* spv,
const char* src,
Desc& d
) {
@@ -747,19 +811,40 @@ void compile_shaders(
EShLanguage lang;
int i;
for (i = 0; i < shader_type_count; i++) {
+ int sm = 1 << i;
if (!d.entrypoints[i].empty()) {
std::string ps;
+ int opt = 0, j;
configure(d, i, define, lang, ps);
- spv[i] = compile_shader(
- d,
- sname,
- fname,
- ps.c_str(),
- src,
- define,
- i,
- lang
- );
+ for (const auto& p : d.options) {
+ if (~p.second.stage & sm) continue;
+ opt |= p.second.mask;
+ }
+ for (j = 0; j <= opt; j++) {
+ spv[i][j] = compile_shader(
+ d,
+ sname,
+ fname,
+ ps.c_str(),
+ src,
+ define,
+ i,
+ j,
+ lang
+ );
+ }
+ if (!opt)
+ spv[i][0] = compile_shader(
+ d,
+ sname,
+ fname,
+ ps.c_str(),
+ src,
+ define,
+ i,
+ 0,
+ lang
+ );
}
}
}
@@ -767,10 +852,14 @@ void compile_shaders(
void write_csh(
const char* fname,
const Desc& d,
- const std::vector<uint32_t>* stages
+ Variant_Map* stages
) {
- int hsize = 20, i, coff;
+ int hsize = 24, i, coff;
FILE* f = fopen(fname, "wb");
+ H_Variant* variants[shader_type_count];
+ H_Option* hopts = 0;
+ int vc[shader_type_count];
+ std::vector<const std::vector<uint32_t>*> order;
if (!f) {
print_err("Failed to open %s\n", fname);
pbreak(500);
@@ -781,6 +870,7 @@ void write_csh(
c = d.bindings.size(); fwrite(&c, 4, 1, f);
c = d.trgts.size(); fwrite(&c, 4, 1, f);
c = d.descriptors.size(); fwrite(&c, 4, 1, f);
+ c = d.options.size(); fwrite(&c, 4, 1, f);
for (const auto& b : d.bindings) {
char buf[24];
int count = b.attrs.size();
@@ -816,36 +906,79 @@ void write_csh(
fwrite(&d.stage, 4, 1, f);
hsize += 32;
}
- hsize += shader_type_count * 32;
- for (i = 0, coff = 0; i < shader_type_count; i++) {
- int o = 0;
- char buf[24];
- memset(buf, 0, sizeof buf);
- if (d.entrypoints[i].empty()) {
- fwrite(&o, 4, 1, f);
- fwrite(&o, 4, 1, f);
- } else {
- int size = stages[i].size() * sizeof(uint32_t);
- strcpy(buf, d.entrypoints[i].c_str());
- o = hsize + coff;
- fwrite(&o, 4, 1, f);
- fwrite(&size, 4, 1, f);
- coff += size;
+ if (d.options.size())
+ hopts = new H_Option[d.options.size()];
+ for (const auto& p : d.options) {
+ const auto& name = p.first;
+ const auto& o = p.second;
+ int count = d.options.size();
+ int j, bucket = (int)(
+ hash_string(name.c_str()) %
+ count
+ );
+ for (j = 0; j < count; j++) {
+ auto& ho = hopts[j];
+ if (!ho.name[0]) {
+ strcpy(ho.name, name.c_str());
+ ho.mask = o.mask;
+ ho.stage = o.stage;
+ goto oklmao;
+ }
+ bucket = (bucket + 1) % count;
}
- fwrite(buf, 1, sizeof buf, f);
+ assert(0);
+ oklmao:
+ hsize += 32;
}
- for (i = 0; i < shader_type_count; i++)
- if (!d.entrypoints[i].empty()) {
- auto& stage = stages[i];
- fwrite(&stage[0], sizeof(uint32_t), stage.size(), f);
+ fwrite(hopts, sizeof *hopts, d.options.size(), f);
+ delete[] hopts;
+ for (i = 0; i < shader_type_count; i++) {
+ vc[i] = stages[i].size();
+ hsize += vc[i] * 16 + 4;
+ variants[i] = new H_Variant[vc[i]];
+ }
+ for (i = 0, coff = 0; i < shader_type_count; i++) {
+ fwrite(&vc[i], 4, 1, f);
+ for (const auto& p : stages[i]) {
+ int mask = p.first, j;
+ int bucket = (int)(
+ fnv1a64((uint8_t*)&mask, sizeof mask) %
+ vc[i]
+ );
+ for (j = 0; j < vc[i]; j++) {
+ H_Variant& v = variants[i][bucket];
+ if (v.o == -1) {
+ auto& arr = p.second;
+ v.o = coff + hsize;
+ v.s = arr.size() * sizeof(uint32_t);
+ v.mask = mask;
+ coff += v.s;
+ order.push_back(&arr);
+ goto done;
+ }
+ bucket = (bucket + 1) % vc[i];
+ }
+ assert(0);
+ done:;
}
+ fwrite(variants[i], sizeof(H_Variant), vc[i], f);
+ delete[] variants[i];
+ }
+ for (auto bytecode : order) {
+ fwrite(
+ &(*bytecode)[0],
+ sizeof(uint32_t),
+ bytecode->size(),
+ f
+ );
+ }
}
int main(int argc, const char** argv) {
char* src;
size_t src_size;
std::string desc_src;
- std::vector<uint32_t> spv[shader_type_count];
+ Variant_Map spv[shader_type_count];
cfg_Object* cdesc;
void* dp_mem;
Desc desc;
diff --git a/video.cpp b/video.cpp
index 9e2699e..b4c5897 100644
--- a/video.cpp
+++ b/video.cpp
@@ -430,6 +430,12 @@ enum {
context_state_init = 1 << 1
};
+
+struct Shader_Module {
+ int mask;
+ VkShaderModule mod;
+};
+
struct Shader_Vk : public Shader, public Late_Terminated {
struct Attribute {
char name[28];
@@ -464,23 +470,31 @@ struct Shader_Vk : public Shader, public Late_Terminated {
int stage;
};
+ struct Option {
+ char name[24];
+ int mask;
+ int stage;
+ };
+
SProgram_Type type;
- VkShaderModule modules[shader_type_count];
- char entrypoints[shader_type_count][24];
Vertex_Format vfd;
Desc* descs;
- int desc_count;
+ Shader_Module* modules[shader_type_count];
+ Option* options;
+ int desc_count, opt_count;
+ int module_count[shader_type_count];
- bool init(Device_Vk* dev, Pack_File* f);
- bool init_module(
+ bool init(Device_Vk* dev, Arena* a, Pack_File* f);
+ VkShaderModule make_module(
Device_Vk* dev,
- int stage,
char* buf,
int size
);
void destroy(Device_Vk* dev) override;
int find_descriptor(const char* name);
+ int find_module(Shader_Type type, int mask);
+ int find_opt(Shader_Type, const char* name);
static VkShaderStageFlagBits stage(Shader_Type type) {
switch (type) {
@@ -2811,12 +2825,24 @@ void Pipeline_Vk::init_stages(
zero(sis, sizeof *sis * count);
for (i = 0, count = 0; i < shader_type_count; i++) {
if (shader.modules[i]) {
+ int idx = shader.find_module(
+ (Shader_Type)i,
+ desc.shader_masks[i]
+ );
+ VkShaderModule mod;
+ if (idx < 0) {
+ mod = shader.modules[i][0].mod;
+ print_war("Shader variant not found; using the default >~<\n");
+ print(" ^ mask was 0x%x\n", desc.shader_masks[i]);
+ } else
+ mod = shader.modules[i][idx].mod;
+ assert(idx >= 0);
auto& si = sis[i];
si.sType = VK_STRUCTURE_TYPE_PIPELINE_SHADER_STAGE_CREATE_INFO;
si.flags = 0;
si.stage = Shader_Vk::stage((Shader_Type)i);
- si.module = shader.modules[i];
- si.pName = shader.entrypoints[i];
+ si.module = mod;
+ si.pName = "main";
count++;
}
}
@@ -3396,9 +3422,8 @@ void Vertex_Format_Vk::optimise(const Vertex_Format_Vk* shadervf) {
}
}
-bool Shader_Vk::init_module(
+VkShaderModule Shader_Vk::make_module(
Device_Vk* dev,
- int stage,
char* buf,
int size
) {
@@ -3409,8 +3434,9 @@ bool Shader_Vk::init_module(
mi.codeSize = size;
mi.pCode = (uint32_t*)buf;
r = vkCreateShaderModule(dev->dev, &mi, &dev->ac, &m);
- modules[stage] = m;
- return r == VK_SUCCESS;
+ if (r == VK_SUCCESS)
+ return m;
+ return 0;
}
int Shader_Vk::Vertex_Format::find_binding(const char* name) {
@@ -3522,8 +3548,11 @@ void Shader_Vk::Vertex_Format::destroy(Device_Vk* dev) {
void Shader_Vk::destroy(Device_Vk* dev) {
int i;
for (i = 0; i < shader_type_count; i++)
- if (modules[i])
- vkDestroyShaderModule(dev->dev, modules[i], &dev->ac);
+ if (modules[i]) {
+ int j, e = module_count[i];
+ for (j = 0; j < e; j++)
+ vkDestroyShaderModule(dev->dev, modules[i][j].mod, &dev->ac);
+ }
vfd.destroy(dev);
heap_free(dev->heap, descs);
dev->destroy_vertex_format(vf);
@@ -3554,6 +3583,11 @@ int Shader::descriptor_binding(const char* name) {
return sh->descs[idx].slot;
}
+int Shader::opt_mask(Shader_Type type, const char* name) {
+ Shader_Vk* sh = (Shader_Vk*)this;
+ return sh->find_opt(type, name);
+}
+
int Shader::descriptor_stage(int slot) {
Shader_Vk* sh = (Shader_Vk*)this;
int i;
@@ -3909,11 +3943,10 @@ Asset* Shader_Loader::load(
Shader_Vk* shader;
Shader_Id id;
(void)s;
- (void)a;
(void)filename;
id = dev->alloc_shader();
shader = (Shader_Vk*)&dev->get_shader(id);
- if (!shader->init(dev, f)) {
+ if (!shader->init(dev, a, f)) {
dev->shaders.remove(id);
return 0;
}
@@ -3939,7 +3972,46 @@ int Shader_Vk::find_descriptor(const char* name) {
return -1;
}
-bool Shader_Vk::init(Device_Vk* dev, Pack_File* f) {
+int Shader_Vk::find_module(
+ Shader_Type type,
+ int mask
+) {
+ int i;
+ int count = module_count[type];
+ Shader_Module* arr = modules[type];
+ int bucket = (int)(
+ fnv1a64((uint8_t*)&mask, sizeof mask) %
+ count
+ );
+ for (i = 0; i < count; i++) {
+ Shader_Module& mod = arr[bucket];
+ if (mod.mask == mask)
+ return bucket;
+ bucket = (bucket + 1) % count;
+ }
+ return -1;
+}
+
+int Shader_Vk::find_opt(
+ Shader_Type type,
+ const char* name
+) {
+ int count = module_count[type], i;
+ int bucket = (int)(
+ hash_string(name) %
+ count
+ );
+ int stage = 1 << type;
+ for (i = 0; i < count; i++) {
+ Option& o = options[bucket];
+ if (string_equal(name, o.name) && (o.stage & stage))
+ return o.mask;
+ bucket = (bucket + 1) % count;
+ }
+ return 0;
+}
+
+bool Shader_Vk::init(Device_Vk* dev, Arena* a, Pack_File* f) {
char magic[4];
int binding_count, target_count, i;
pack_read(f, magic, 4);
@@ -3953,6 +4025,7 @@ bool Shader_Vk::init(Device_Vk* dev, Pack_File* f) {
pack_read(f, &binding_count, 4);
pack_read(f, &target_count, 4);
pack_read(f, &desc_count, 4);
+ pack_read(f, &opt_count, 4);
assert(binding_count);
vfd.binding_count = binding_count;
if (!vfd.init(dev, f))
@@ -4000,24 +4073,60 @@ bool Shader_Vk::init(Device_Vk* dev, Pack_File* f) {
desc_count * sizeof *descs
);
pack_read(f, descs, desc_count * sizeof *descs);
+ options = (Option*)arena_alloc(
+ a,
+ opt_count * sizeof *options
+ );
+ pack_read(f, options, opt_count * sizeof *options);
for (i = 0; i < shader_type_count; i++) {
- int o, s;
- pack_read(f, &o, 4);
- pack_read(f, &s, 4);
- if (o) {
- bool r;
- int before = pack_tell(f);
- char* buf = (char*)heap_alloc(dev->heap, s);
- pack_seek(f, o, seek_rel_start);
- pack_read(f, buf, s);
- r = init_module(dev, i, buf, s);
- heap_free(dev->heap, buf);
- pack_seek(f, before, seek_rel_start);
- if (!r) return false;
+ int c;
+ pack_read(f, &c, 4);
+ module_count[i] = c;
+ if (c) {
+ int o, s, mask;
+ int bucket, j;
+ Shader_Module* m = (Shader_Module*)arena_alloc(
+ a,
+ c * sizeof *m
+ );
+ for (j = 0; j < c; j++) {
+ m[j].mask = -1;
+ }
+ for (j = 0; j < c; j++) {
+ int k;
+ pack_read(f, &o, 4); /* H_Variant */
+ pack_read(f, &s, 4);
+ pack_read(f, &mask, 4);
+ pack_seek(f, 4, seek_rel_cur);
+ bucket = (int)(
+ fnv1a64((uint8_t*)&m, sizeof m) %
+ c
+ );
+ for (k = 0; k < c; k++) {
+ Shader_Module& mod = m[bucket];
+ if (mod.mask == -1)
+ goto found;
+ bucket = (bucket + 1) % c;
+ }
+ assert(0);
+ {
+ found:
+ char* buf = (char*)heap_alloc(dev->heap, s);
+ VkShaderModule r;
+ int before = pack_tell(f);
+ pack_seek(f, o, seek_rel_start);
+ pack_read(f, buf, s);
+ r = make_module(dev, buf, s);
+ heap_free(dev->heap, buf);
+ pack_seek(f, before, seek_rel_start);
+ if (!r) return false;
+ m[bucket] = Shader_Module { mask, r };
+ }
+ }
+ modules[i] = m;
} else {
- modules[i] = VK_NULL_HANDLE;
+ modules[i] = 0;
}
- pack_read(f, entrypoints[i], 24);
}
return true;
}
diff --git a/video.hpp b/video.hpp
index 530b126..f1bedb1 100644
--- a/video.hpp
+++ b/video.hpp
@@ -134,12 +134,18 @@ struct Pipeline {
Vertex_Format_Id vertex_format;
Shader_Id shader;
int samples;
+ int shader_masks[shader_type_count];
Descriptor descriptors[pipeline_max_descriptors];
int descriptor_count;
void hash();
bool pipeline_eq(const Pipeline& other) const {
+ int i;
+ for (i = 0; i < shader_type_count; i++) {
+ if (other.shader_masks[i] != shader_masks[i])
+ return false;
+ }
return
shader == other.shader &&
vertex_format == other.vertex_format &&
@@ -333,6 +339,7 @@ struct Pipeline_Builder {
);
PB& cull(Cull_Mode mode);
PB& shader(Shader_Id s);
+ PB& option(Shader_Type type, int mask);
PB& vertex_format(Vertex_Format_Id vf);
PB& texture(int binding, Texture_Id t, Sampler_Id s);
PB& cbuffer(
@@ -588,6 +595,7 @@ struct Shader : public Asset {
int attribute_index(const char* name);
int target_index(const char* name);
int descriptor_binding(const char* name);
+ int opt_mask(Shader_Type type, const char* name);
int descriptor_stage(int slot);
};