Lines Matching refs:cs
231 void cs_get(struct hl_cs *cs) in cs_get() argument
233 kref_get(&cs->refcount); in cs_get()
236 static int cs_get_unless_zero(struct hl_cs *cs) in cs_get_unless_zero() argument
238 return kref_get_unless_zero(&cs->refcount); in cs_get_unless_zero()
241 static void cs_put(struct hl_cs *cs) in cs_put() argument
243 kref_put(&cs->refcount, cs_do_release); in cs_put()
258 bool cs_needs_completion(struct hl_cs *cs) in cs_needs_completion() argument
263 if (cs->staged_cs && !cs->staged_last) in cs_needs_completion()
269 bool cs_needs_timeout(struct hl_cs *cs) in cs_needs_timeout() argument
274 if (cs->staged_cs && !cs->staged_first) in cs_needs_timeout()
309 parser.ctx_id = job->cs->ctx->asid; in cs_parser()
310 parser.cs_sequence = job->cs->sequence; in cs_parser()
321 parser.completion = cs_needs_completion(job->cs); in cs_parser()
350 struct hl_cs *cs = job->cs; in hl_complete_job() local
381 spin_lock(&cs->job_lock); in hl_complete_job()
383 spin_unlock(&cs->job_lock); in hl_complete_job()
399 if (cs_needs_completion(cs) && in hl_complete_job()
401 cs_put(cs); in hl_complete_job()
418 struct hl_cs *cs; in hl_staged_cs_find_first() local
420 list_for_each_entry_reverse(cs, &hdev->cs_mirror_list, mirror_node) in hl_staged_cs_find_first()
421 if (cs->staged_cs && cs->staged_first && in hl_staged_cs_find_first()
422 cs->sequence == cs_seq) in hl_staged_cs_find_first()
423 return cs; in hl_staged_cs_find_first()
435 bool is_staged_cs_last_exists(struct hl_device *hdev, struct hl_cs *cs) in is_staged_cs_last_exists() argument
439 last_entry = list_last_entry(&cs->staged_cs_node, struct hl_cs, in is_staged_cs_last_exists()
458 static void staged_cs_get(struct hl_device *hdev, struct hl_cs *cs) in staged_cs_get() argument
465 if (!cs->staged_last) in staged_cs_get()
466 cs_get(cs); in staged_cs_get()
477 static void staged_cs_put(struct hl_device *hdev, struct hl_cs *cs) in staged_cs_put() argument
482 if (!cs_needs_completion(cs)) in staged_cs_put()
483 cs_put(cs); in staged_cs_put()
486 static void cs_handle_tdr(struct hl_device *hdev, struct hl_cs *cs) in cs_handle_tdr() argument
490 if (!cs_needs_timeout(cs)) in cs_handle_tdr()
503 if (cs->staged_cs && cs->staged_last) { in cs_handle_tdr()
504 first_cs = hl_staged_cs_find_first(hdev, cs->staged_sequence); in cs_handle_tdr()
506 cs = first_cs; in cs_handle_tdr()
514 if (cs->timedout || hdev->timeout_jiffies == MAX_SCHEDULE_TIMEOUT) in cs_handle_tdr()
517 if (cs->tdr_active) in cs_handle_tdr()
518 cancel_delayed_work_sync(&cs->work_tdr); in cs_handle_tdr()
586 static void complete_multi_cs(struct hl_device *hdev, struct hl_cs *cs) in complete_multi_cs() argument
588 struct hl_fence *fence = cs->fence; in complete_multi_cs()
592 if (cs->staged_cs && !cs->staged_first) in complete_multi_cs()
636 struct hl_cs *cs, in cs_release_sob_reset_handler() argument
643 if (!hl_cs_cmpl->hw_sob || !cs->submitted) in cs_release_sob_reset_handler()
676 struct hl_cs *cs = container_of(ref, struct hl_cs, refcount); in cs_do_release() local
677 struct hl_device *hdev = cs->ctx->hdev; in cs_do_release()
680 container_of(cs->fence, struct hl_cs_compl, base_fence); in cs_do_release()
682 cs->completed = true; in cs_do_release()
692 list_for_each_entry_safe(job, tmp, &cs->job_list, cs_node) in cs_do_release()
695 if (!cs->submitted) { in cs_do_release()
701 if (cs->type == CS_TYPE_WAIT || in cs_do_release()
702 cs->type == CS_TYPE_COLLECTIVE_WAIT) in cs_do_release()
703 hl_fence_put(cs->signal_fence); in cs_do_release()
709 hl_hw_queue_update_ci(cs); in cs_do_release()
713 list_del_init(&cs->mirror_node); in cs_do_release()
716 cs_handle_tdr(hdev, cs); in cs_do_release()
718 if (cs->staged_cs) { in cs_do_release()
722 if (cs->staged_last) { in cs_do_release()
726 &cs->staged_cs_node, staged_cs_node) in cs_do_release()
734 if (cs->submitted) { in cs_do_release()
736 list_del(&cs->staged_cs_node); in cs_do_release()
748 if ((cs->type == CS_TYPE_WAIT || cs->type == CS_TYPE_COLLECTIVE_WAIT) in cs_do_release()
749 && cs->encaps_signals) in cs_do_release()
750 kref_put(&cs->encaps_sig_hdl->refcount, in cs_do_release()
757 hl_debugfs_remove_cs(cs); in cs_do_release()
759 hdev->shadow_cs_queue[cs->sequence & (hdev->asic_prop.max_pending_cs - 1)] = NULL; in cs_do_release()
765 if (cs->timedout) in cs_do_release()
766 cs->fence->error = -ETIMEDOUT; in cs_do_release()
767 else if (cs->aborted) in cs_do_release()
768 cs->fence->error = -EIO; in cs_do_release()
769 else if (!cs->submitted) in cs_do_release()
770 cs->fence->error = -EBUSY; in cs_do_release()
772 if (unlikely(cs->skip_reset_on_timeout)) { in cs_do_release()
775 cs->sequence, in cs_do_release()
776 div_u64(jiffies - cs->submission_time_jiffies, HZ)); in cs_do_release()
779 if (cs->timestamp) { in cs_do_release()
780 cs->fence->timestamp = ktime_get(); in cs_do_release()
781 hl_push_cs_outcome(hdev, &cs->ctx->outcome_store, cs->sequence, in cs_do_release()
782 cs->fence->timestamp, cs->fence->error); in cs_do_release()
785 hl_ctx_put(cs->ctx); in cs_do_release()
787 complete_all(&cs->fence->completion); in cs_do_release()
788 complete_multi_cs(hdev, cs); in cs_do_release()
790 cs_release_sob_reset_handler(hdev, cs, hl_cs_cmpl); in cs_do_release()
792 hl_fence_put(cs->fence); in cs_do_release()
794 kfree(cs->jobs_in_queue_cnt); in cs_do_release()
795 kfree(cs); in cs_do_release()
803 struct hl_cs *cs = container_of(work, struct hl_cs, in cs_timedout() local
805 bool skip_reset_on_timeout = cs->skip_reset_on_timeout, device_reset = false; in cs_timedout()
807 rc = cs_get_unless_zero(cs); in cs_timedout()
811 if ((!cs->submitted) || (cs->completed)) { in cs_timedout()
812 cs_put(cs); in cs_timedout()
816 hdev = cs->ctx->hdev; in cs_timedout()
825 cs->timedout = true; in cs_timedout()
832 hdev->captured_err_info.cs_timeout.seq = cs->sequence; in cs_timedout()
840 switch (cs->type) { in cs_timedout()
844 cs->sequence); in cs_timedout()
850 cs->sequence); in cs_timedout()
856 cs->sequence); in cs_timedout()
862 cs->sequence); in cs_timedout()
870 cs_put(cs); in cs_timedout()
883 struct hl_cs *cs; in allocate_cs() local
888 cs = kzalloc(sizeof(*cs), GFP_ATOMIC); in allocate_cs()
889 if (!cs) in allocate_cs()
890 cs = kzalloc(sizeof(*cs), GFP_KERNEL); in allocate_cs()
892 if (!cs) { in allocate_cs()
901 cs->ctx = ctx; in allocate_cs()
902 cs->submitted = false; in allocate_cs()
903 cs->completed = false; in allocate_cs()
904 cs->type = cs_type; in allocate_cs()
905 cs->timestamp = !!(flags & HL_CS_FLAGS_TIMESTAMP); in allocate_cs()
906 cs->encaps_signals = !!(flags & HL_CS_FLAGS_ENCAP_SIGNALS); in allocate_cs()
907 cs->timeout_jiffies = timeout; in allocate_cs()
908 cs->skip_reset_on_timeout = in allocate_cs()
911 cs->submission_time_jiffies = jiffies; in allocate_cs()
912 INIT_LIST_HEAD(&cs->job_list); in allocate_cs()
913 INIT_DELAYED_WORK(&cs->work_tdr, cs_timedout); in allocate_cs()
914 kref_init(&cs->refcount); in allocate_cs()
915 spin_lock_init(&cs->job_lock); in allocate_cs()
928 cs->jobs_in_queue_cnt = kcalloc(hdev->asic_prop.max_queues, in allocate_cs()
929 sizeof(*cs->jobs_in_queue_cnt), GFP_ATOMIC); in allocate_cs()
930 if (!cs->jobs_in_queue_cnt) in allocate_cs()
931 cs->jobs_in_queue_cnt = kcalloc(hdev->asic_prop.max_queues, in allocate_cs()
932 sizeof(*cs->jobs_in_queue_cnt), GFP_KERNEL); in allocate_cs()
934 if (!cs->jobs_in_queue_cnt) { in allocate_cs()
942 cs_cmpl->type = cs->type; in allocate_cs()
944 cs->fence = &cs_cmpl->base_fence; in allocate_cs()
976 cs->sequence = cs_cmpl->cs_seq; in allocate_cs()
989 *cs_new = cs; in allocate_cs()
995 kfree(cs->jobs_in_queue_cnt); in allocate_cs()
999 kfree(cs); in allocate_cs()
1004 static void cs_rollback(struct hl_device *hdev, struct hl_cs *cs) in cs_rollback() argument
1008 staged_cs_put(hdev, cs); in cs_rollback()
1010 list_for_each_entry_safe(job, tmp, &cs->job_list, cs_node) in cs_rollback()
1017 struct hl_cs *cs, *tmp; in hl_cs_rollback_all() local
1032 list_for_each_entry_safe(cs, tmp, &hdev->cs_mirror_list, mirror_node) { in hl_cs_rollback_all()
1033 cs_get(cs); in hl_cs_rollback_all()
1034 cs->aborted = true; in hl_cs_rollback_all()
1036 cs->ctx->asid, cs->sequence); in hl_cs_rollback_all()
1037 cs_rollback(hdev, cs); in hl_cs_rollback_all()
1038 cs_put(cs); in hl_cs_rollback_all()
1096 struct hl_cs *cs = job->cs; in job_wq_completion() local
1097 struct hl_device *hdev = cs->ctx->hdev; in job_wq_completion()
1105 struct hl_cs *cs = container_of(work, struct hl_cs, finish_work); in cs_completion() local
1106 struct hl_device *hdev = cs->ctx->hdev; in cs_completion()
1109 list_for_each_entry_safe(job, tmp, &cs->job_list, cs_node) in cs_completion()
1346 static int cs_staged_submission(struct hl_device *hdev, struct hl_cs *cs, in cs_staged_submission() argument
1353 cs->staged_last = !!(flags & HL_CS_FLAGS_STAGED_SUBMISSION_LAST); in cs_staged_submission()
1354 cs->staged_first = !!(flags & HL_CS_FLAGS_STAGED_SUBMISSION_FIRST); in cs_staged_submission()
1356 if (cs->staged_first) { in cs_staged_submission()
1358 INIT_LIST_HEAD(&cs->staged_cs_node); in cs_staged_submission()
1359 cs->staged_sequence = cs->sequence; in cs_staged_submission()
1361 if (cs->encaps_signals) in cs_staged_submission()
1362 cs->encaps_sig_hdl_id = encaps_signal_handle; in cs_staged_submission()
1367 cs->staged_sequence = sequence; in cs_staged_submission()
1371 staged_cs_get(hdev, cs); in cs_staged_submission()
1373 cs->staged_cs = true; in cs_staged_submission()
1400 struct hl_cs *cs; in cs_ioctl_default() local
1422 staged_mid ? user_sequence : ULLONG_MAX, &cs, flags, in cs_ioctl_default()
1427 *cs_seq = cs->sequence; in cs_ioctl_default()
1429 hl_debugfs_add_cs(cs); in cs_ioctl_default()
1431 rc = cs_staged_submission(hdev, cs, user_sequence, flags, in cs_ioctl_default()
1439 if (cs->staged_cs) in cs_ioctl_default()
1440 *cs_seq = cs->staged_sequence; in cs_ioctl_default()
1500 job->cs = cs; in cs_ioctl_default()
1505 cs->jobs_in_queue_cnt[job->hw_queue_id]++; in cs_ioctl_default()
1506 cs->jobs_cnt++; in cs_ioctl_default()
1508 list_add_tail(&job->cs_node, &cs->job_list); in cs_ioctl_default()
1516 if (cs_needs_completion(cs) && in cs_ioctl_default()
1519 cs_get(cs); in cs_ioctl_default()
1529 cs->ctx->asid, cs->sequence, job->id, rc); in cs_ioctl_default()
1537 if (int_queues_only && cs_needs_completion(cs)) { in cs_ioctl_default()
1542 cs->ctx->asid, cs->sequence); in cs_ioctl_default()
1548 INIT_WORK(&cs->finish_work, cs_completion); in cs_ioctl_default()
1555 cs->fence->stream_master_qid_map = stream_master_qid_map; in cs_ioctl_default()
1557 rc = hl_hw_queue_schedule_cs(cs); in cs_ioctl_default()
1562 cs->ctx->asid, cs->sequence, rc); in cs_ioctl_default()
1566 *signal_initial_sob_count = cs->initial_sob_count; in cs_ioctl_default()
1575 cs_rollback(hdev, cs); in cs_ioctl_default()
1580 cs_put(cs); in cs_ioctl_default()
1844 struct hl_ctx *ctx, struct hl_cs *cs, in cs_ioctl_signal_wait_create_jobs() argument
1862 if (cs->type == CS_TYPE_WAIT) in cs_ioctl_signal_wait_create_jobs()
1877 job->cs = cs; in cs_ioctl_signal_wait_create_jobs()
1883 if ((cs->type == CS_TYPE_WAIT || cs->type == CS_TYPE_COLLECTIVE_WAIT) in cs_ioctl_signal_wait_create_jobs()
1884 && cs->encaps_signals) in cs_ioctl_signal_wait_create_jobs()
1897 cs_get(cs); in cs_ioctl_signal_wait_create_jobs()
1899 cs->jobs_in_queue_cnt[job->hw_queue_id]++; in cs_ioctl_signal_wait_create_jobs()
1900 cs->jobs_cnt++; in cs_ioctl_signal_wait_create_jobs()
1902 list_add_tail(&job->cs_node, &cs->job_list); in cs_ioctl_signal_wait_create_jobs()
2115 struct hl_cs *cs; in cs_ioctl_signal_wait() local
2275 rc = allocate_cs(hdev, ctx, cs_type, ULLONG_MAX, &cs, flags, timeout); in cs_ioctl_signal_wait()
2290 cs->signal_fence = sig_fence; in cs_ioctl_signal_wait()
2295 if (cs->encaps_signals) in cs_ioctl_signal_wait()
2296 cs->encaps_sig_hdl = encaps_sig_hdl; in cs_ioctl_signal_wait()
2299 hl_debugfs_add_cs(cs); in cs_ioctl_signal_wait()
2301 *cs_seq = cs->sequence; in cs_ioctl_signal_wait()
2304 rc = cs_ioctl_signal_wait_create_jobs(hdev, ctx, cs, q_type, in cs_ioctl_signal_wait()
2308 cs, q_idx, collective_engine_id, in cs_ioctl_signal_wait()
2320 INIT_WORK(&cs->finish_work, cs_completion); in cs_ioctl_signal_wait()
2322 rc = hl_hw_queue_schedule_cs(cs); in cs_ioctl_signal_wait()
2333 ctx->asid, cs->sequence, rc); in cs_ioctl_signal_wait()
2337 *signal_sob_addr_offset = cs->sob_addr_offset; in cs_ioctl_signal_wait()
2338 *signal_initial_sob_count = cs->initial_sob_count; in cs_ioctl_signal_wait()
2346 cs_rollback(hdev, cs); in cs_ioctl_signal_wait()
2351 cs_put(cs); in cs_ioctl_signal_wait()