Lines Matching +full:arr +full:- +full:diff
47 /* the next index to assign to a NIR in-memory object */
74 /* the next index to assign to a NIR in-memory object */
77 /* The length of the index -> object table */
95 uint32_t index = ctx->next_idx++; in write_add_object()
97 _mesa_hash_table_insert(ctx->remap_table, obj, (void *)(uintptr_t)index); in write_add_object()
103 struct hash_entry *entry = _mesa_hash_table_search(ctx->remap_table, obj); in write_lookup_object()
105 return (uint32_t)(uintptr_t)entry->data; in write_lookup_object()
111 assert(ctx->next_idx < ctx->idx_table_len); in read_add_object()
112 ctx->idx_table[ctx->next_idx++] = obj; in read_add_object()
118 assert(idx < ctx->idx_table_len); in read_lookup_object()
119 return ctx->idx_table[idx]; in read_lookup_object()
125 return read_lookup_object(ctx, blob_read_uint32(ctx->blob)); in read_object()
142 return 1 << (bit_size - 1); in decode_bit_size_3bits()
179 blob_write_bytes(ctx->blob, c->values, sizeof(c->values)); in write_constant()
180 blob_write_uint32(ctx->blob, c->num_elements); in write_constant()
181 for (unsigned i = 0; i < c->num_elements; i++) in write_constant()
182 write_constant(ctx, c->elements[i]); in write_constant()
190 static const nir_const_value zero_vals[ARRAY_SIZE(c->values)] = { 0 }; in read_constant()
191 blob_copy_bytes(ctx->blob, (uint8_t *)c->values, sizeof(c->values)); in read_constant()
192 c->is_null_constant = memcmp(c->values, zero_vals, sizeof(c->values)) == 0; in read_constant()
193 c->num_elements = blob_read_uint32(ctx->blob); in read_constant()
194 c->elements = ralloc_array(nvar, nir_constant *, c->num_elements); in read_constant()
195 for (unsigned i = 0; i < c->num_elements; i++) { in read_constant()
196 c->elements[i] = read_constant(ctx, nvar); in read_constant()
197 c->is_null_constant &= c->elements[i]->is_null_constant; in read_constant()
240 assert(var->num_state_slots < (1 << 7)); in write_variable()
246 flags.u.has_name = !ctx->strip && var->name; in write_variable()
247 flags.u.has_constant_initializer = !!(var->constant_initializer); in write_variable()
248 flags.u.has_pointer_initializer = !!(var->pointer_initializer); in write_variable()
249 flags.u.has_interface_type = !!(var->interface_type); in write_variable()
250 flags.u.type_same_as_last = var->type == ctx->last_type; in write_variable()
252 var->interface_type && var->interface_type == ctx->last_interface_type; in write_variable()
253 flags.u.num_state_slots = var->num_state_slots; in write_variable()
254 flags.u.num_members = var->num_members; in write_variable()
256 struct nir_variable_data data = var->data; in write_variable()
261 if (ctx->strip && in write_variable()
267 /* Temporary variables don't serialize var->data. */ in write_variable()
275 tmp.location = ctx->last_var_data.location; in write_variable()
276 tmp.location_frac = ctx->last_var_data.location_frac; in write_variable()
277 tmp.driver_location = ctx->last_var_data.driver_location; in write_variable()
282 if (memcmp(&ctx->last_var_data, &tmp, sizeof(tmp)) == 0 && in write_variable()
283 abs((int)data.location - in write_variable()
284 (int)ctx->last_var_data.location) < (1 << 12) && in write_variable()
285 abs((int)data.driver_location - in write_variable()
286 (int)ctx->last_var_data.driver_location) < (1 << 15)) in write_variable()
292 flags.u.ray_query = var->data.ray_query; in write_variable()
294 blob_write_uint32(ctx->blob, flags.u32); in write_variable()
297 encode_type_to_blob(ctx->blob, var->type); in write_variable()
298 ctx->last_type = var->type; in write_variable()
301 if (var->interface_type && !flags.u.interface_type_same_as_last) { in write_variable()
302 encode_type_to_blob(ctx->blob, var->interface_type); in write_variable()
303 ctx->last_interface_type = var->interface_type; in write_variable()
307 blob_write_string(ctx->blob, var->name); in write_variable()
312 blob_write_bytes(ctx->blob, &data, sizeof(data)); in write_variable()
316 union packed_var_data_diff diff; in write_variable() local
318 diff.u.location = data.location - ctx->last_var_data.location; in write_variable()
319 diff.u.location_frac = data.location_frac - in write_variable()
320 ctx->last_var_data.location_frac; in write_variable()
321 diff.u.driver_location = data.driver_location - in write_variable()
322 ctx->last_var_data.driver_location; in write_variable()
324 blob_write_uint32(ctx->blob, diff.u32); in write_variable()
327 ctx->last_var_data = data; in write_variable()
330 for (unsigned i = 0; i < var->num_state_slots; i++) { in write_variable()
331 blob_write_bytes(ctx->blob, &var->state_slots[i], in write_variable()
332 sizeof(var->state_slots[i])); in write_variable()
334 if (var->constant_initializer) in write_variable()
335 write_constant(ctx, var->constant_initializer); in write_variable()
336 if (var->pointer_initializer) in write_variable()
337 blob_write_uint32(ctx->blob, in write_variable()
338 write_lookup_object(ctx, var->pointer_initializer)); in write_variable()
339 if (var->num_members > 0) { in write_variable()
340 blob_write_bytes(ctx->blob, (uint8_t *)var->members, in write_variable()
341 var->num_members * sizeof(*var->members)); in write_variable()
348 nir_variable *var = rzalloc(ctx->nir, nir_variable); in read_variable()
352 flags.u32 = blob_read_uint32(ctx->blob); in read_variable()
355 var->type = ctx->last_type; in read_variable()
357 var->type = decode_type_from_blob(ctx->blob); in read_variable()
358 ctx->last_type = var->type; in read_variable()
363 var->interface_type = ctx->last_interface_type; in read_variable()
365 var->interface_type = decode_type_from_blob(ctx->blob); in read_variable()
366 ctx->last_interface_type = var->interface_type; in read_variable()
371 const char *name = blob_read_string(ctx->blob); in read_variable()
372 var->name = ralloc_strdup(var, name); in read_variable()
374 var->name = NULL; in read_variable()
378 var->data.mode = nir_var_shader_temp; in read_variable()
380 var->data.mode = nir_var_function_temp; in read_variable()
382 blob_copy_bytes(ctx->blob, (uint8_t *)&var->data, sizeof(var->data)); in read_variable()
383 ctx->last_var_data = var->data; in read_variable()
385 union packed_var_data_diff diff; in read_variable() local
386 diff.u32 = blob_read_uint32(ctx->blob); in read_variable()
388 var->data = ctx->last_var_data; in read_variable()
389 var->data.location += diff.u.location; in read_variable()
390 var->data.location_frac += diff.u.location_frac; in read_variable()
391 var->data.driver_location += diff.u.driver_location; in read_variable()
393 ctx->last_var_data = var->data; in read_variable()
396 var->data.ray_query = flags.u.ray_query; in read_variable()
398 var->num_state_slots = flags.u.num_state_slots; in read_variable()
399 if (var->num_state_slots != 0) { in read_variable()
400 var->state_slots = ralloc_array(var, nir_state_slot, in read_variable()
401 var->num_state_slots); in read_variable()
402 for (unsigned i = 0; i < var->num_state_slots; i++) { in read_variable()
403 blob_copy_bytes(ctx->blob, &var->state_slots[i], in read_variable()
404 sizeof(var->state_slots[i])); in read_variable()
408 var->constant_initializer = read_constant(ctx, var); in read_variable()
410 var->constant_initializer = NULL; in read_variable()
413 var->pointer_initializer = read_object(ctx); in read_variable()
415 var->pointer_initializer = NULL; in read_variable()
417 var->num_members = flags.u.num_members; in read_variable()
418 if (var->num_members > 0) { in read_variable()
419 var->members = ralloc_array(var, struct nir_variable_data, in read_variable()
420 var->num_members); in read_variable()
421 blob_copy_bytes(ctx->blob, (uint8_t *)var->members, in read_variable()
422 var->num_members * sizeof(*var->members)); in read_variable()
431 blob_write_uint32(ctx->blob, exec_list_length(src)); in write_var_list()
441 unsigned num_vars = blob_read_uint32(ctx->blob); in read_var_list()
444 exec_list_push_tail(dst, &var->node); in read_var_list()
451 unsigned _pad : 2; /* <-- Header */
453 unsigned _footer : 10; /* <-- Footer */
456 unsigned _header : 22; /* <-- Header */
457 unsigned _pad : 2; /* <-- Footer */
464 unsigned _header : 22; /* <-- Header */
465 unsigned src_type : 5; /* <-- Footer */
473 header.any.object_idx = write_lookup_object(ctx, src->ssa); in write_src_full()
474 blob_write_uint32(ctx->blob, header.u32); in write_src_full()
489 header.u32 = blob_read_uint32(ctx->blob); in read_src()
491 src->ssa = read_lookup_object(ctx, header.any.object_idx); in read_src()
523 * good for floating-point decimals
527 /* packed_value contains low 19 bits, high bits are sign-extended */
618 encode_num_components_in_3bits(def->num_components); in write_def()
619 pdef.bit_size = encode_bit_size_3bits(def->bit_size); in write_def()
620 pdef.divergent = def->divergent; in write_def()
630 if (ctx->last_instr_type == nir_instr_type_alu) { in write_def()
631 assert(ctx->last_alu_header_offset); in write_def()
633 last_header.u32 = ctx->last_alu_header; in write_def()
646 blob_overwrite_uint32(ctx->blob, ctx->last_alu_header_offset, in write_def()
648 ctx->last_alu_header = last_header.u32; in write_def()
654 ctx->last_alu_header_offset = blob_reserve_uint32(ctx->blob); in write_def()
655 blob_overwrite_uint32(ctx->blob, ctx->last_alu_header_offset, header.u32); in write_def()
656 ctx->last_alu_header = header.u32; in write_def()
659 blob_write_uint32(ctx->blob, header.u32); in write_def()
663 blob_write_uint32(ctx->blob, def->num_components); in write_def()
678 num_components = blob_read_uint32(ctx->blob); in read_def()
682 def->divergent = pdef.divergent; in read_def()
690 return ctx->next_idx < (1 << 16); in are_object_ids_16bit()
696 unsigned num_srcs = nir_op_infos[alu->op].num_inputs; in is_alu_src_ssa_16bit()
705 if (i < 2 && chan == 0 && alu->src[i].swizzle[chan] < 4) in is_alu_src_ssa_16bit()
708 if (alu->src[i].swizzle[chan] != chan) in is_alu_src_ssa_16bit()
719 unsigned num_srcs = nir_op_infos[alu->op].num_inputs; in write_alu()
726 header.alu.instr_type = alu->instr.type; in write_alu()
727 header.alu.exact = alu->exact; in write_alu()
728 header.alu.no_signed_wrap = alu->no_signed_wrap; in write_alu()
729 header.alu.no_unsigned_wrap = alu->no_unsigned_wrap; in write_alu()
730 header.alu.op = alu->op; in write_alu()
735 header.alu.writemask_or_two_swizzles = alu->src[0].swizzle[0]; in write_alu()
737 header.alu.writemask_or_two_swizzles |= alu->src[1].swizzle[0] << 2; in write_alu()
740 write_def(ctx, &alu->def, header, alu->instr.type); in write_alu()
744 unsigned idx = write_lookup_object(ctx, alu->src[i].src.ssa); in write_alu()
746 blob_write_uint16(ctx->blob, idx); in write_alu()
751 unsigned src_components = nir_src_num_components(alu->src[i].src); in write_alu()
757 src.alu.swizzle_x = alu->src[i].swizzle[0]; in write_alu()
758 src.alu.swizzle_y = alu->src[i].swizzle[1]; in write_alu()
759 src.alu.swizzle_z = alu->src[i].swizzle[2]; in write_alu()
760 src.alu.swizzle_w = alu->src[i].swizzle[3]; in write_alu()
763 write_src_full(ctx, &alu->src[i].src, src); in write_alu()
771 value |= (uint32_t)alu->src[i].swizzle[o + j] << (4 * j); /* 4 bits per swizzle */ in write_alu()
774 blob_write_uint32(ctx->blob, value); in write_alu()
785 nir_alu_instr *alu = nir_alu_instr_create(ctx->nir, header.alu.op); in read_alu()
787 alu->exact = header.alu.exact; in read_alu()
788 alu->no_signed_wrap = header.alu.no_signed_wrap; in read_alu()
789 alu->no_unsigned_wrap = header.alu.no_unsigned_wrap; in read_alu()
791 read_def(ctx, &alu->def, &alu->instr, header); in read_alu()
795 nir_alu_src *src = &alu->src[i]; in read_alu()
796 src->src.ssa = read_lookup_object(ctx, blob_read_uint16(ctx->blob)); in read_alu()
798 memset(&src->swizzle, 0, sizeof(src->swizzle)); in read_alu()
803 src->swizzle[chan] = chan; in read_alu()
807 union packed_src src = read_src(ctx, &alu->src[i].src); in read_alu()
809 unsigned src_components = nir_src_num_components(alu->src[i].src); in read_alu()
812 memset(&alu->src[i].swizzle, 0, sizeof(alu->src[i].swizzle)); in read_alu()
815 alu->src[i].swizzle[0] = src.alu.swizzle_x; in read_alu()
816 alu->src[i].swizzle[1] = src.alu.swizzle_y; in read_alu()
817 alu->src[i].swizzle[2] = src.alu.swizzle_z; in read_alu()
818 alu->src[i].swizzle[3] = src.alu.swizzle_w; in read_alu()
822 unsigned value = blob_read_uint32(ctx->blob); in read_alu()
825 alu->src[i].swizzle[o + j] = in read_alu()
834 alu->src[0].swizzle[0] = header.alu.writemask_or_two_swizzles & 0x3; in read_alu()
836 alu->src[1].swizzle[0] = header.alu.writemask_or_two_swizzles >> 2; in read_alu()
849 return modes << (ffs(nir_var_mem_generic) - 1); in decode_deref_modes()
871 enc = modes >> (ffs(nir_var_mem_generic) - 1); in encode_deref_modes()
876 enc = ffs(modes) - 1; in encode_deref_modes()
886 assert(deref->deref_type < 8); in write_deref()
891 header.deref.instr_type = deref->instr.type; in write_deref()
892 header.deref.deref_type = deref->deref_type; in write_deref()
894 if (deref->deref_type == nir_deref_type_cast) { in write_deref()
895 header.deref.modes = encode_deref_modes(deref->modes); in write_deref()
896 header.deref.cast_type_same_as_last = deref->type == ctx->last_type; in write_deref()
900 if (deref->deref_type == nir_deref_type_var) { in write_deref()
901 var_idx = write_lookup_object(ctx, deref->var); in write_deref()
906 if (deref->deref_type == nir_deref_type_array || in write_deref()
907 deref->deref_type == nir_deref_type_ptr_as_array) { in write_deref()
910 header.deref.in_bounds = deref->arr.in_bounds; in write_deref()
913 write_def(ctx, &deref->def, header, deref->instr.type); in write_deref()
915 switch (deref->deref_type) { in write_deref()
918 blob_write_uint32(ctx->blob, var_idx); in write_deref()
922 write_src(ctx, &deref->parent); in write_deref()
923 blob_write_uint32(ctx->blob, deref->strct.index); in write_deref()
929 blob_write_uint16(ctx->blob, in write_deref()
930 write_lookup_object(ctx, deref->parent.ssa)); in write_deref()
931 blob_write_uint16(ctx->blob, in write_deref()
932 write_lookup_object(ctx, deref->arr.index.ssa)); in write_deref()
934 write_src(ctx, &deref->parent); in write_deref()
935 write_src(ctx, &deref->arr.index); in write_deref()
940 write_src(ctx, &deref->parent); in write_deref()
941 blob_write_uint32(ctx->blob, deref->cast.ptr_stride); in write_deref()
942 blob_write_uint32(ctx->blob, deref->cast.align_mul); in write_deref()
943 blob_write_uint32(ctx->blob, deref->cast.align_offset); in write_deref()
945 encode_type_to_blob(ctx->blob, deref->type); in write_deref()
946 ctx->last_type = deref->type; in write_deref()
951 write_src(ctx, &deref->parent); in write_deref()
963 nir_deref_instr *deref = nir_deref_instr_create(ctx->nir, deref_type); in read_deref()
965 read_def(ctx, &deref->def, &deref->instr, header); in read_deref()
969 switch (deref->deref_type) { in read_deref()
972 deref->var = read_lookup_object(ctx, header.deref_var.object_idx); in read_deref()
974 deref->var = read_object(ctx); in read_deref()
976 deref->type = deref->var->type; in read_deref()
980 read_src(ctx, &deref->parent); in read_deref()
981 parent = nir_src_as_deref(deref->parent); in read_deref()
982 deref->strct.index = blob_read_uint32(ctx->blob); in read_deref()
983 deref->type = glsl_get_struct_field(parent->type, deref->strct.index); in read_deref()
989 deref->parent.ssa = read_lookup_object(ctx, blob_read_uint16(ctx->blob)); in read_deref()
990 deref->arr.index.ssa = read_lookup_object(ctx, blob_read_uint16(ctx->blob)); in read_deref()
992 read_src(ctx, &deref->parent); in read_deref()
993 read_src(ctx, &deref->arr.index); in read_deref()
996 deref->arr.in_bounds = header.deref.in_bounds; in read_deref()
998 parent = nir_src_as_deref(deref->parent); in read_deref()
999 if (deref->deref_type == nir_deref_type_array) in read_deref()
1000 deref->type = glsl_get_array_element(parent->type); in read_deref()
1002 deref->type = parent->type; in read_deref()
1006 read_src(ctx, &deref->parent); in read_deref()
1007 deref->cast.ptr_stride = blob_read_uint32(ctx->blob); in read_deref()
1008 deref->cast.align_mul = blob_read_uint32(ctx->blob); in read_deref()
1009 deref->cast.align_offset = blob_read_uint32(ctx->blob); in read_deref()
1011 deref->type = ctx->last_type; in read_deref()
1013 deref->type = decode_type_from_blob(ctx->blob); in read_deref()
1014 ctx->last_type = deref->type; in read_deref()
1019 read_src(ctx, &deref->parent); in read_deref()
1020 parent = nir_src_as_deref(deref->parent); in read_deref()
1021 deref->type = glsl_get_array_element(parent->type); in read_deref()
1029 deref->modes = deref->var->data.mode; in read_deref()
1030 } else if (deref->deref_type == nir_deref_type_cast) { in read_deref()
1031 deref->modes = decode_deref_modes(header.deref.modes); in read_deref()
1033 deref->modes = nir_instr_as_deref(deref->parent.ssa->parent_instr)->modes; in read_deref()
1044 unsigned num_srcs = nir_intrinsic_infos[intrin->intrinsic].num_srcs; in write_intrinsic()
1045 unsigned num_indices = nir_intrinsic_infos[intrin->intrinsic].num_indices; in write_intrinsic()
1046 assert(intrin->intrinsic < 1024); in write_intrinsic()
1051 header.intrinsic.instr_type = intrin->instr.type; in write_intrinsic()
1052 header.intrinsic.intrinsic = intrin->intrinsic; in write_intrinsic()
1058 unsigned max = util_last_bit(intrin->const_index[i]); in write_intrinsic()
1069 intrin->const_index[i] << (i * bit_size); in write_intrinsic()
1079 if (nir_intrinsic_infos[intrin->intrinsic].has_dest) in write_intrinsic()
1080 write_def(ctx, &intrin->def, header, intrin->instr.type); in write_intrinsic()
1082 blob_write_uint32(ctx->blob, header.u32); in write_intrinsic()
1085 write_src(ctx, &intrin->src[i]); in write_intrinsic()
1091 blob_write_uint8(ctx->blob, intrin->const_index[i]); in write_intrinsic()
1095 blob_write_uint16(ctx->blob, intrin->const_index[i]); in write_intrinsic()
1099 blob_write_uint32(ctx->blob, intrin->const_index[i]); in write_intrinsic()
1109 nir_intrinsic_instr *intrin = nir_intrinsic_instr_create(ctx->nir, op); in read_intrinsic()
1115 read_def(ctx, &intrin->def, &intrin->instr, header); in read_intrinsic()
1118 read_src(ctx, &intrin->src[i]); in read_intrinsic()
1125 intrin->num_components = intrin->def.num_components; in read_intrinsic()
1129 intrin->num_components = nir_src_num_components(intrin->src[i]); in read_intrinsic()
1141 intrin->const_index[i] = in read_intrinsic()
1149 intrin->const_index[i] = blob_read_uint8(ctx->blob); in read_intrinsic()
1153 intrin->const_index[i] = blob_read_uint16(ctx->blob); in read_intrinsic()
1157 intrin->const_index[i] = blob_read_uint32(ctx->blob); in read_intrinsic()
1168 assert(lc->def.num_components >= 1 && lc->def.num_components <= 16); in write_load_const()
1172 header.load_const.instr_type = lc->instr.type; in write_load_const()
1173 header.load_const.last_component = lc->def.num_components - 1; in write_load_const()
1174 header.load_const.bit_size = encode_bit_size_3bits(lc->def.bit_size); in write_load_const()
1177 /* Try to pack 1-component constants into the 19 free bits in the header. */ in write_load_const()
1178 if (lc->def.num_components == 1) { in write_load_const()
1179 switch (lc->def.bit_size) { in write_load_const()
1181 if ((lc->value[0].u64 & 0x1fffffffffffull) == 0) { in write_load_const()
1184 header.load_const.packed_value = lc->value[0].u64 >> 45; in write_load_const()
1185 } else if (util_mask_sign_extend(lc->value[0].i64, 19) == lc->value[0].i64) { in write_load_const()
1186 /* packed_value contains low 19 bits, high bits are sign-extended */ in write_load_const()
1188 header.load_const.packed_value = lc->value[0].u64; in write_load_const()
1193 if ((lc->value[0].u32 & 0x1fff) == 0) { in write_load_const()
1195 header.load_const.packed_value = lc->value[0].u32 >> 13; in write_load_const()
1196 } else if (util_mask_sign_extend(lc->value[0].i32, 19) == lc->value[0].i32) { in write_load_const()
1198 header.load_const.packed_value = lc->value[0].u32; in write_load_const()
1204 header.load_const.packed_value = lc->value[0].u16; in write_load_const()
1208 header.load_const.packed_value = lc->value[0].u8; in write_load_const()
1212 header.load_const.packed_value = lc->value[0].b; in write_load_const()
1219 blob_write_uint32(ctx->blob, header.u32); in write_load_const()
1222 switch (lc->def.bit_size) { in write_load_const()
1224 blob_write_bytes(ctx->blob, lc->value, in write_load_const()
1225 sizeof(*lc->value) * lc->def.num_components); in write_load_const()
1229 for (unsigned i = 0; i < lc->def.num_components; i++) in write_load_const()
1230 blob_write_uint32(ctx->blob, lc->value[i].u32); in write_load_const()
1234 for (unsigned i = 0; i < lc->def.num_components; i++) in write_load_const()
1235 blob_write_uint16(ctx->blob, lc->value[i].u16); in write_load_const()
1239 assert(lc->def.bit_size <= 8); in write_load_const()
1240 for (unsigned i = 0; i < lc->def.num_components; i++) in write_load_const()
1241 blob_write_uint8(ctx->blob, lc->value[i].u8); in write_load_const()
1246 write_add_object(ctx, &lc->def); in write_load_const()
1253 nir_load_const_instr_create(ctx->nir, header.load_const.last_component + 1, in read_load_const()
1255 lc->def.divergent = false; in read_load_const()
1259 switch (lc->def.bit_size) { in read_load_const()
1261 lc->value[0].u64 = (uint64_t)header.load_const.packed_value << 45; in read_load_const()
1264 lc->value[0].u32 = (uint64_t)header.load_const.packed_value << 13; in read_load_const()
1272 switch (lc->def.bit_size) { in read_load_const()
1274 lc->value[0].u64 = header.load_const.packed_value; in read_load_const()
1275 if (lc->value[0].u64 >> 18) in read_load_const()
1276 lc->value[0].u64 |= UINT64_C(0xfffffffffff80000); in read_load_const()
1279 lc->value[0].u32 = header.load_const.packed_value; in read_load_const()
1280 if (lc->value[0].u32 >> 18) in read_load_const()
1281 lc->value[0].u32 |= 0xfff80000; in read_load_const()
1284 lc->value[0].u16 = header.load_const.packed_value; in read_load_const()
1287 lc->value[0].u8 = header.load_const.packed_value; in read_load_const()
1290 lc->value[0].b = header.load_const.packed_value; in read_load_const()
1298 switch (lc->def.bit_size) { in read_load_const()
1300 blob_copy_bytes(ctx->blob, lc->value, sizeof(*lc->value) * lc->def.num_components); in read_load_const()
1304 for (unsigned i = 0; i < lc->def.num_components; i++) in read_load_const()
1305 lc->value[i].u32 = blob_read_uint32(ctx->blob); in read_load_const()
1309 for (unsigned i = 0; i < lc->def.num_components; i++) in read_load_const()
1310 lc->value[i].u16 = blob_read_uint16(ctx->blob); in read_load_const()
1314 assert(lc->def.bit_size <= 8); in read_load_const()
1315 for (unsigned i = 0; i < lc->def.num_components; i++) in read_load_const()
1316 lc->value[i].u8 = blob_read_uint8(ctx->blob); in read_load_const()
1322 read_add_object(ctx, &lc->def); in read_load_const()
1329 assert(undef->def.num_components >= 1 && undef->def.num_components <= 16); in write_ssa_undef()
1334 header.undef.instr_type = undef->instr.type; in write_ssa_undef()
1335 header.undef.last_component = undef->def.num_components - 1; in write_ssa_undef()
1336 header.undef.bit_size = encode_bit_size_3bits(undef->def.bit_size); in write_ssa_undef()
1338 blob_write_uint32(ctx->blob, header.u32); in write_ssa_undef()
1339 write_add_object(ctx, &undef->def); in write_ssa_undef()
1346 nir_undef_instr_create(ctx->nir, header.undef.last_component + 1, in read_ssa_undef()
1349 undef->def.divergent = false; in read_ssa_undef()
1351 read_add_object(ctx, &undef->def); in read_ssa_undef()
1377 assert(tex->num_srcs < 16); in write_tex()
1378 assert(tex->op < 32); in write_tex()
1383 header.tex.instr_type = tex->instr.type; in write_tex()
1384 header.tex.num_srcs = tex->num_srcs; in write_tex()
1385 header.tex.op = tex->op; in write_tex()
1387 write_def(ctx, &tex->def, header, tex->instr.type); in write_tex()
1389 blob_write_uint32(ctx->blob, tex->texture_index); in write_tex()
1390 blob_write_uint32(ctx->blob, tex->sampler_index); in write_tex()
1391 blob_write_uint32(ctx->blob, tex->backend_flags); in write_tex()
1392 if (tex->op == nir_texop_tg4) in write_tex()
1393 blob_write_bytes(ctx->blob, tex->tg4_offsets, sizeof(tex->tg4_offsets)); in write_tex()
1397 .u.sampler_dim = tex->sampler_dim, in write_tex()
1398 .u.dest_type = tex->dest_type, in write_tex()
1399 .u.coord_components = tex->coord_components, in write_tex()
1400 .u.is_array = tex->is_array, in write_tex()
1401 .u.is_shadow = tex->is_shadow, in write_tex()
1402 .u.is_new_style_shadow = tex->is_new_style_shadow, in write_tex()
1403 .u.is_sparse = tex->is_sparse, in write_tex()
1404 .u.component = tex->component, in write_tex()
1405 .u.texture_non_uniform = tex->texture_non_uniform, in write_tex()
1406 .u.sampler_non_uniform = tex->sampler_non_uniform, in write_tex()
1407 .u.array_is_lowered_cube = tex->array_is_lowered_cube, in write_tex()
1408 .u.is_gather_implicit_lod = tex->is_gather_implicit_lod, in write_tex()
1410 blob_write_uint32(ctx->blob, packed.u32); in write_tex()
1412 for (unsigned i = 0; i < tex->num_srcs; i++) { in write_tex()
1415 src.tex.src_type = tex->src[i].src_type; in write_tex()
1416 write_src_full(ctx, &tex->src[i].src, src); in write_tex()
1423 nir_tex_instr *tex = nir_tex_instr_create(ctx->nir, header.tex.num_srcs); in read_tex()
1425 read_def(ctx, &tex->def, &tex->instr, header); in read_tex()
1427 tex->op = header.tex.op; in read_tex()
1428 tex->texture_index = blob_read_uint32(ctx->blob); in read_tex()
1429 tex->sampler_index = blob_read_uint32(ctx->blob); in read_tex()
1430 tex->backend_flags = blob_read_uint32(ctx->blob); in read_tex()
1431 if (tex->op == nir_texop_tg4) in read_tex()
1432 blob_copy_bytes(ctx->blob, tex->tg4_offsets, sizeof(tex->tg4_offsets)); in read_tex()
1435 packed.u32 = blob_read_uint32(ctx->blob); in read_tex()
1436 tex->sampler_dim = packed.u.sampler_dim; in read_tex()
1437 tex->dest_type = packed.u.dest_type; in read_tex()
1438 tex->coord_components = packed.u.coord_components; in read_tex()
1439 tex->is_array = packed.u.is_array; in read_tex()
1440 tex->is_shadow = packed.u.is_shadow; in read_tex()
1441 tex->is_new_style_shadow = packed.u.is_new_style_shadow; in read_tex()
1442 tex->is_sparse = packed.u.is_sparse; in read_tex()
1443 tex->component = packed.u.component; in read_tex()
1444 tex->texture_non_uniform = packed.u.texture_non_uniform; in read_tex()
1445 tex->sampler_non_uniform = packed.u.sampler_non_uniform; in read_tex()
1446 tex->array_is_lowered_cube = packed.u.array_is_lowered_cube; in read_tex()
1447 tex->is_gather_implicit_lod = packed.u.is_gather_implicit_lod; in read_tex()
1449 for (unsigned i = 0; i < tex->num_srcs; i++) { in read_tex()
1450 union packed_src src = read_src(ctx, &tex->src[i].src); in read_tex()
1451 tex->src[i].src_type = src.tex.src_type; in read_tex()
1463 header.phi.instr_type = phi->instr.type; in write_phi()
1464 header.phi.num_srcs = exec_list_length(&phi->srcs); in write_phi()
1471 write_def(ctx, &phi->def, header, phi->instr.type); in write_phi()
1474 size_t blob_offset = blob_reserve_uint32(ctx->blob); in write_phi()
1475 ASSERTED size_t blob_offset2 = blob_reserve_uint32(ctx->blob); in write_phi()
1479 .src = src->src.ssa, in write_phi()
1480 .block = src->pred, in write_phi()
1482 util_dynarray_append(&ctx->phi_fixups, write_phi_fixup, fixup); in write_phi()
1489 util_dynarray_foreach(&ctx->phi_fixups, write_phi_fixup, fixup) { in write_fixup_phis()
1490 blob_overwrite_uint32(ctx->blob, fixup->blob_offset, in write_fixup_phis()
1491 write_lookup_object(ctx, fixup->src)); in write_fixup_phis()
1492 blob_overwrite_uint32(ctx->blob, fixup->blob_offset + sizeof(uint32_t), in write_fixup_phis()
1493 write_lookup_object(ctx, fixup->block)); in write_fixup_phis()
1496 util_dynarray_clear(&ctx->phi_fixups); in write_fixup_phis()
1502 nir_phi_instr *phi = nir_phi_instr_create(ctx->nir); in read_phi()
1504 read_def(ctx, &phi->def, &phi->instr, header); in read_phi()
1510 * from the blob for now) don't get inserted into the old shader's use-def in read_phi()
1514 nir_instr_insert_after_block(blk, &phi->instr); in read_phi()
1517 nir_def *def = (nir_def *)(uintptr_t)blob_read_uint32(ctx->blob); in read_phi()
1518 nir_block *pred = (nir_block *)(uintptr_t)blob_read_uint32(ctx->blob); in read_phi()
1525 nir_src_set_parent_instr(&src->src, &phi->instr); in read_phi()
1530 list_add(&src->src.use_link, &ctx->phi_srcs); in read_phi()
1539 list_for_each_entry_safe(nir_phi_src, src, &ctx->phi_srcs, src.use_link) { in read_fixup_phis()
1540 src->pred = read_lookup_object(ctx, (uintptr_t)src->pred); in read_fixup_phis()
1541 src->src.ssa = read_lookup_object(ctx, (uintptr_t)src->src.ssa); in read_fixup_phis()
1544 list_del(&src->src.use_link); in read_fixup_phis()
1546 list_addtail(&src->src.use_link, &src->src.ssa->uses); in read_fixup_phis()
1548 assert(list_is_empty(&ctx->phi_srcs)); in read_fixup_phis()
1555 assert(jmp->type != nir_jump_goto && jmp->type != nir_jump_goto_if); in write_jump()
1557 assert(jmp->type < 4); in write_jump()
1562 header.jump.instr_type = jmp->instr.type; in write_jump()
1563 header.jump.type = jmp->type; in write_jump()
1565 blob_write_uint32(ctx->blob, header.u32); in write_jump()
1575 nir_jump_instr *jmp = nir_jump_instr_create(ctx->nir, header.jump.type); in read_jump()
1582 blob_write_uint32(ctx->blob, write_lookup_object(ctx, call->callee)); in write_call()
1584 for (unsigned i = 0; i < call->num_params; i++) in write_call()
1585 write_src(ctx, &call->params[i]); in write_call()
1592 nir_call_instr *call = nir_call_instr_create(ctx->nir, callee); in read_call()
1594 for (unsigned i = 0; i < call->num_params; i++) in read_call()
1595 read_src(ctx, &call->params[i]); in read_call()
1604 assert(instr->type < 16); in write_instr()
1606 switch (instr->type) { in write_instr()
1632 blob_write_uint32(ctx->blob, instr->type); in write_instr()
1648 header.u32 = blob_read_uint32(ctx->blob); in read_instr()
1654 nir_instr_insert_after_block(block, &read_alu(ctx, header)->instr); in read_instr()
1657 instr = &read_deref(ctx, header)->instr; in read_instr()
1660 instr = &read_intrinsic(ctx, header)->instr; in read_instr()
1663 instr = &read_load_const(ctx, header)->instr; in read_instr()
1666 instr = &read_ssa_undef(ctx, header)->instr; in read_instr()
1669 instr = &read_tex(ctx, header)->instr; in read_instr()
1680 instr = &read_jump(ctx, header)->instr; in read_instr()
1683 instr = &read_call(ctx)->instr; in read_instr()
1699 blob_write_uint32(ctx->blob, exec_list_length(&block->instr_list)); in write_block()
1701 ctx->last_instr_type = ~0; in write_block()
1702 ctx->last_alu_header_offset = 0; in write_block()
1706 ctx->last_instr_type = instr->type; in write_block()
1715 * no two blocks are side-by-side in the IR; It should be empty. in read_block()
1721 unsigned num_instrs = blob_read_uint32(ctx->blob); in read_block()
1736 write_src(ctx, &nif->condition); in write_if()
1737 blob_write_uint8(ctx->blob, nif->control); in write_if()
1739 write_cf_list(ctx, &nif->then_list); in write_if()
1740 write_cf_list(ctx, &nif->else_list); in write_if()
1746 nir_if *nif = nir_if_create(ctx->nir); in read_if()
1748 read_src(ctx, &nif->condition); in read_if()
1749 nif->control = blob_read_uint8(ctx->blob); in read_if()
1751 nir_cf_node_insert_end(cf_list, &nif->cf_node); in read_if()
1753 read_cf_list(ctx, &nif->then_list); in read_if()
1754 read_cf_list(ctx, &nif->else_list); in read_if()
1760 blob_write_uint8(ctx->blob, loop->control); in write_loop()
1761 blob_write_uint8(ctx->blob, loop->divergent); in write_loop()
1763 blob_write_uint8(ctx->blob, has_continue_construct); in write_loop()
1765 write_cf_list(ctx, &loop->body); in write_loop()
1767 write_cf_list(ctx, &loop->continue_list); in write_loop()
1774 nir_loop *loop = nir_loop_create(ctx->nir); in read_loop()
1776 nir_cf_node_insert_end(cf_list, &loop->cf_node); in read_loop()
1778 loop->control = blob_read_uint8(ctx->blob); in read_loop()
1779 loop->divergent = blob_read_uint8(ctx->blob); in read_loop()
1780 bool has_continue_construct = blob_read_uint8(ctx->blob); in read_loop()
1782 read_cf_list(ctx, &loop->body); in read_loop()
1785 read_cf_list(ctx, &loop->continue_list); in read_loop()
1792 blob_write_uint32(ctx->blob, cf->type); in write_cf_node()
1794 switch (cf->type) { in write_cf_node()
1812 nir_cf_node_type type = blob_read_uint32(ctx->blob); in read_cf_node()
1832 blob_write_uint32(ctx->blob, exec_list_length(cf_list)); in write_cf_list()
1841 uint32_t num_cf_nodes = blob_read_uint32(ctx->blob); in read_cf_list()
1849 blob_write_uint8(ctx->blob, fi->structured); in write_function_impl()
1850 blob_write_uint8(ctx->blob, !!fi->preamble); in write_function_impl()
1852 if (fi->preamble) in write_function_impl()
1853 blob_write_uint32(ctx->blob, write_lookup_object(ctx, fi->preamble)); in write_function_impl()
1855 write_var_list(ctx, &fi->locals); in write_function_impl()
1857 write_cf_list(ctx, &fi->body); in write_function_impl()
1864 nir_function_impl *fi = nir_function_impl_create_bare(ctx->nir); in read_function_impl()
1866 fi->structured = blob_read_uint8(ctx->blob); in read_function_impl()
1867 bool preamble = blob_read_uint8(ctx->blob); in read_function_impl()
1870 fi->preamble = read_object(ctx); in read_function_impl()
1872 read_var_list(ctx, &fi->locals); in read_function_impl()
1874 read_cf_list(ctx, &fi->body); in read_function_impl()
1877 fi->valid_metadata = 0; in read_function_impl()
1886 if (fxn->is_entrypoint) in write_function()
1888 if (fxn->is_preamble) in write_function()
1890 if (fxn->name) in write_function()
1892 if (fxn->impl) in write_function()
1894 if (fxn->should_inline) in write_function()
1896 if (fxn->dont_inline) in write_function()
1898 blob_write_uint32(ctx->blob, flags); in write_function()
1899 if (fxn->name) in write_function()
1900 blob_write_string(ctx->blob, fxn->name); in write_function()
1904 blob_write_uint32(ctx->blob, fxn->num_params); in write_function()
1905 for (unsigned i = 0; i < fxn->num_params; i++) { in write_function()
1907 ((uint32_t)fxn->params[i].num_components) | in write_function()
1908 ((uint32_t)fxn->params[i].bit_size) << 8; in write_function()
1909 blob_write_uint32(ctx->blob, val); in write_function()
1922 uint32_t flags = blob_read_uint32(ctx->blob); in read_function()
1924 char *name = has_name ? blob_read_string(ctx->blob) : NULL; in read_function()
1926 nir_function *fxn = nir_function_create(ctx->nir, name); in read_function()
1930 fxn->num_params = blob_read_uint32(ctx->blob); in read_function()
1931 fxn->params = ralloc_array(fxn, nir_parameter, fxn->num_params); in read_function()
1932 for (unsigned i = 0; i < fxn->num_params; i++) { in read_function()
1933 uint32_t val = blob_read_uint32(ctx->blob); in read_function()
1934 fxn->params[i].num_components = val & 0xff; in read_function()
1935 fxn->params[i].bit_size = (val >> 8) & 0xff; in read_function()
1938 fxn->is_entrypoint = flags & 0x1; in read_function()
1939 fxn->is_preamble = flags & 0x2; in read_function()
1941 fxn->impl = NIR_SERIALIZE_FUNC_HAS_IMPL; in read_function()
1942 fxn->should_inline = flags & 0x10; in read_function()
1943 fxn->dont_inline = flags & 0x20; in read_function()
1950 blob_write_uint32(ctx->blob, 0); in write_xfb_info()
1952 size_t size = nir_xfb_info_size(xfb->output_count); in write_xfb_info()
1954 blob_write_uint32(ctx->blob, size); in write_xfb_info()
1955 blob_write_bytes(ctx->blob, xfb, size); in write_xfb_info()
1962 uint32_t size = blob_read_uint32(ctx->blob); in read_xfb_info()
1966 struct nir_xfb_info *xfb = ralloc_size(ctx->nir, size); in read_xfb_info()
1967 blob_copy_bytes(ctx->blob, (void *)xfb, size); in read_xfb_info()
1991 struct shader_info info = nir->info; in nir_serialize()
2005 write_var_list(&ctx, &nir->variables); in nir_serialize()
2007 blob_write_uint32(blob, nir->num_inputs); in nir_serialize()
2008 blob_write_uint32(blob, nir->num_uniforms); in nir_serialize()
2009 blob_write_uint32(blob, nir->num_outputs); in nir_serialize()
2010 blob_write_uint32(blob, nir->scratch_size); in nir_serialize()
2012 blob_write_uint32(blob, exec_list_length(&nir->functions)); in nir_serialize()
2021 blob_write_uint32(blob, nir->constant_data_size); in nir_serialize()
2022 if (nir->constant_data_size > 0) in nir_serialize()
2023 blob_write_bytes(blob, nir->constant_data, nir->constant_data_size); in nir_serialize()
2025 write_xfb_info(&ctx, nir->xfb_info); in nir_serialize()
2027 if (nir->info.uses_printf) in nir_serialize()
2028 nir_serialize_printf_info(blob, nir->printf_info, nir->printf_info_count); in nir_serialize()
2059 ctx.nir->info = info; in nir_deserialize()
2061 read_var_list(&ctx, &ctx.nir->variables); in nir_deserialize()
2063 ctx.nir->num_inputs = blob_read_uint32(blob); in nir_deserialize()
2064 ctx.nir->num_uniforms = blob_read_uint32(blob); in nir_deserialize()
2065 ctx.nir->num_outputs = blob_read_uint32(blob); in nir_deserialize()
2066 ctx.nir->scratch_size = blob_read_uint32(blob); in nir_deserialize()
2073 if (fxn->impl == NIR_SERIALIZE_FUNC_HAS_IMPL) in nir_deserialize()
2077 ctx.nir->constant_data_size = blob_read_uint32(blob); in nir_deserialize()
2078 if (ctx.nir->constant_data_size > 0) { in nir_deserialize()
2079 ctx.nir->constant_data = in nir_deserialize()
2080 ralloc_size(ctx.nir, ctx.nir->constant_data_size); in nir_deserialize()
2081 blob_copy_bytes(blob, ctx.nir->constant_data, in nir_deserialize()
2082 ctx.nir->constant_data_size); in nir_deserialize()
2085 ctx.nir->xfb_info = read_xfb_info(&ctx); in nir_deserialize()
2087 if (ctx.nir->info.uses_printf) { in nir_deserialize()
2088 ctx.nir->printf_info = in nir_deserialize()
2090 &ctx.nir->printf_info_count); in nir_deserialize()
2103 const struct nir_shader_compiler_options *options = shader->options; in nir_shader_serialize_deserialize()
2134 blob_write_uint32(blob, info->num_args); in nir_serialize_printf_info()
2135 blob_write_uint32(blob, info->string_size); in nir_serialize_printf_info()
2136 blob_write_bytes(blob, info->arg_sizes, in nir_serialize_printf_info()
2137 info->num_args * sizeof(info->arg_sizes[0])); in nir_serialize_printf_info()
2140 blob_write_bytes(blob, info->strings, info->string_size); in nir_serialize_printf_info()
2156 info->num_args = blob_read_uint32(blob); in nir_deserialize_printf_info()
2157 info->string_size = blob_read_uint32(blob); in nir_deserialize_printf_info()
2158 info->arg_sizes = ralloc_array(mem_ctx, unsigned, info->num_args); in nir_deserialize_printf_info()
2159 blob_copy_bytes(blob, info->arg_sizes, in nir_deserialize_printf_info()
2160 info->num_args * sizeof(info->arg_sizes[0])); in nir_deserialize_printf_info()
2161 info->strings = ralloc_array(mem_ctx, char, info->string_size); in nir_deserialize_printf_info()
2162 blob_copy_bytes(blob, info->strings, info->string_size); in nir_deserialize_printf_info()