Lines Matching +full:non +full:- +full:live

30  * the general-purpose DMA mode) or reading system memory it shouldn't
31 * (reading it as a texture, uniform data, or direct-addressed TMU
109 return 64 + waddr - QPU_W_ACC0; in waddr_to_live_reg_index()
159 uint32_t s = validated_shader->num_texture_samples; in record_texture_sample()
163 temp_samples = krealloc(validated_shader->texture_samples, in record_texture_sample()
170 &validation_state->tmu_setup[tmu], in record_texture_sample()
173 validated_shader->num_texture_samples = s + 1; in record_texture_sample()
174 validated_shader->texture_samples = temp_samples; in record_texture_sample()
177 validation_state->tmu_setup[tmu].p_offset[i] = ~0; in record_texture_sample()
187 uint64_t inst = validation_state->shader[validation_state->ip]; in check_tmu_write()
195 bool is_direct = submit && validation_state->tmu_write_count[tmu] == 0; in check_tmu_write()
227 clamp_offset = validation_state->live_min_clamp_offsets[clamp_reg]; in check_tmu_write()
236 validation_state->tmu_setup[tmu].p_offset[1] = in check_tmu_write()
245 validation_state->tmu_setup[tmu].is_direct = true; in check_tmu_write()
255 if (validation_state->tmu_write_count[tmu] >= 4) { in check_tmu_write()
260 validation_state->tmu_setup[tmu].p_offset[validation_state->tmu_write_count[tmu]] = in check_tmu_write()
261 validated_shader->uniforms_size; in check_tmu_write()
262 validation_state->tmu_write_count[tmu]++; in check_tmu_write()
267 if (validation_state->needs_uniform_address_update) { in check_tmu_write()
272 validated_shader->uniforms_size += 4; in check_tmu_write()
281 validation_state->tmu_write_count[tmu] = 0; in check_tmu_write()
289 uint32_t o = validated_shader->num_uniform_addr_offsets; in require_uniform_address_uniform()
290 uint32_t num_uniforms = validated_shader->uniforms_size / 4; in require_uniform_address_uniform()
292 validated_shader->uniform_addr_offsets = in require_uniform_address_uniform()
293 krealloc(validated_shader->uniform_addr_offsets, in require_uniform_address_uniform()
295 sizeof(*validated_shader->uniform_addr_offsets), in require_uniform_address_uniform()
297 if (!validated_shader->uniform_addr_offsets) in require_uniform_address_uniform()
300 validated_shader->uniform_addr_offsets[o] = num_uniforms; in require_uniform_address_uniform()
301 validated_shader->num_uniform_addr_offsets++; in require_uniform_address_uniform()
311 uint64_t inst = validation_state->shader[validation_state->ip]; in validate_uniform_address_write()
319 u32 expected_offset = validated_shader->uniforms_size + 4; in validate_uniform_address_write()
360 if (add_lri == -1) { in validate_uniform_address_write()
366 if (validation_state->live_immediates[add_lri] != expected_offset) { in validate_uniform_address_write()
368 validation_state->live_immediates[add_lri], in validate_uniform_address_write()
380 validation_state->needs_uniform_address_update = false; in validate_uniform_address_write()
381 validation_state->needs_uniform_address_for_loop = false; in validate_uniform_address_write()
390 uint64_t inst = validation_state->shader[validation_state->ip]; in check_reg_write()
399 if (lri != -1) { in check_reg_write()
407 validation_state->live_immediates[lri] = in check_reg_write()
410 validation_state->live_immediates[lri] = ~0; in check_reg_write()
414 validation_state->all_registers_used = true; in check_reg_write()
481 uint64_t inst = validation_state->shader[validation_state->ip]; in track_live_clamps()
495 /* Check whether OP_ADD's A argumennt comes from a live MAX(x, 0), in track_live_clamps()
496 * before we clear previous live state. in track_live_clamps()
500 validation_state->live_max_clamp_regs[lri_add_a]); in track_live_clamps()
502 /* Clear live state for registers written by our instruction. */ in track_live_clamps()
506 validation_state->live_max_clamp_regs[lri_mul] = false; in track_live_clamps()
507 validation_state->live_min_clamp_offsets[lri_mul] = ~0; in track_live_clamps()
510 validation_state->live_max_clamp_regs[lri_add] = false; in track_live_clamps()
511 validation_state->live_min_clamp_offsets[lri_add] = ~0; in track_live_clamps()
513 /* Nothing further to do for live tracking, since only ADDs in track_live_clamps()
514 * generate new live clamp registers. in track_live_clamps()
519 /* Now, handle remaining live clamp tracking for the ADD operation. */ in track_live_clamps()
525 /* Track live clamps of a value to a minimum of 0 (in either in track_live_clamps()
533 validation_state->live_max_clamp_regs[lri_add] = true; in track_live_clamps()
535 /* Track live clamps of a value clamped to a minimum of 0 and in track_live_clamps()
547 validation_state->live_min_clamp_offsets[lri_add] = in track_live_clamps()
548 validated_shader->uniforms_size; in track_live_clamps()
556 uint64_t inst = validation_state->shader[validation_state->ip]; in check_instruction_writes()
585 validation_state->needs_uniform_address_for_loop = true; in check_branch()
592 validation_state->ip); in check_branch()
603 uint64_t inst = validation_state->shader[validation_state->ip]; in check_instruction_reads()
614 validated_shader->uniforms_size += 4; in check_instruction_reads()
616 if (validation_state->needs_uniform_address_update) { in check_instruction_reads()
625 validation_state->all_registers_used = true; in check_instruction_reads()
639 int last_branch = -2; in vc4_validate_branches()
641 for (ip = 0; ip < validation_state->max_ip; ip++) { in vc4_validate_branches()
642 uint64_t inst = validation_state->shader[ip]; in vc4_validate_branches()
651 * finished. validation_state->max_ip is the in vc4_validate_branches()
655 validation_state->max_ip = ip + 3; in vc4_validate_branches()
662 if (ip - last_branch < 4) { in vc4_validate_branches()
690 if (branch_target_ip >= validation_state->max_ip) { in vc4_validate_branches()
693 validation_state->max_ip); in vc4_validate_branches()
696 set_bit(branch_target_ip, validation_state->branch_targets); in vc4_validate_branches()
698 /* Make sure that the non-branching path is also not outside in vc4_validate_branches()
701 if (after_delay_ip >= validation_state->max_ip) { in vc4_validate_branches()
704 ip, after_delay_ip, validation_state->max_ip); in vc4_validate_branches()
707 set_bit(after_delay_ip, validation_state->branch_targets); in vc4_validate_branches()
711 if (max_branch_target > validation_state->max_ip - 3) { in vc4_validate_branches()
728 validation_state->tmu_setup[i / 4].p_offset[i % 4] = ~0; in reset_validation_state()
731 validation_state->live_min_clamp_offsets[i] = ~0; in reset_validation_state()
732 validation_state->live_max_clamp_regs[i] = false; in reset_validation_state()
733 validation_state->live_immediates[i] = ~0; in reset_validation_state()
740 return (validation_state->tmu_write_count[0] != 0 || in texturing_in_progress()
741 validation_state->tmu_write_count[1] != 0); in texturing_in_progress()
747 uint32_t ip = validation_state->ip; in vc4_handle_branch_target()
749 if (!test_bit(ip, validation_state->branch_targets)) in vc4_handle_branch_target()
757 /* Reset our live values tracking, since this instruction may have in vc4_handle_branch_target()
761 * example, all predecessors have a live max clamp in the same in vc4_handle_branch_target()
771 * validation, or a one-off the end-of-program check. in vc4_handle_branch_target()
773 validation_state->needs_uniform_address_update = true; in vc4_handle_branch_target()
781 struct vc4_dev *vc4 = to_vc4_dev(shader_obj->base.dev); in vc4_validate_shader()
784 uint32_t last_thread_switch_ip = -3; in vc4_validate_shader()
789 if (WARN_ON_ONCE(vc4->is_vc5)) in vc4_validate_shader()
793 validation_state.shader = shader_obj->vaddr; in vc4_validate_shader()
794 validation_state.max_ip = shader_obj->base.size / sizeof(uint64_t); in vc4_validate_shader()
821 /* Reset r0-r3 live clamp data */ in vc4_validate_shader()
859 validated_shader->is_threaded = true; in vc4_validate_shader()
907 shader_obj->base.size); in vc4_validate_shader()
912 if (validated_shader->is_threaded && in vc4_validate_shader()
931 validated_shader->uniforms_size += 4; in vc4_validate_shader()
935 * scenario is 8 bytes of uniforms plus handles per 8-byte in vc4_validate_shader()
938 validated_shader->uniforms_src_size = in vc4_validate_shader()
939 (validated_shader->uniforms_size + in vc4_validate_shader()
940 4 * validated_shader->num_texture_samples); in vc4_validate_shader()
949 kfree(validated_shader->uniform_addr_offsets); in vc4_validate_shader()
950 kfree(validated_shader->texture_samples); in vc4_validate_shader()