uint64_t tes_patch_inputs_read;
unsigned tcs_vertices_out;
uint32_t num_patches;
- uint32_t lds_size;
+ uint32_t num_lds_blocks;
uint8_t num_linked_inputs;
uint8_t num_linked_outputs;
uint8_t num_linked_patch_outputs;
}
static inline unsigned
-calculate_tess_lds_size(unsigned tcs_num_input_vertices,
+calculate_tess_lds_size(enum chip_class chip_class,
+ unsigned tcs_num_input_vertices,
unsigned tcs_num_output_vertices,
unsigned tcs_num_inputs,
unsigned tcs_num_patches,
unsigned output_patch0_offset = input_patch_size * tcs_num_patches;
- return output_patch0_offset + output_patch_size * tcs_num_patches;
+ unsigned lds_size = output_patch0_offset + output_patch_size * tcs_num_patches;
+
+ if (chip_class >= GFX7) {
+ assert(lds_size <= 65536);
+ lds_size = align(lds_size, 512) / 512;
+ } else {
+ assert(lds_size <= 32768);
+ lds_size = align(lds_size, 256) / 256;
+ }
+
+ return lds_size;
}
static inline unsigned