| /* |
| * |
| * (C) COPYRIGHT 2010-2019 ARM Limited. All rights reserved. |
| * |
| * This program is free software and is provided to you under the terms of the |
| * GNU General Public License version 2 as published by the Free Software |
| * Foundation, and any use by you of this program is subject to the terms |
| * of such GNU licence. |
| * |
| * This program is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| * GNU General Public License for more details. |
| * |
| * You should have received a copy of the GNU General Public License |
| * along with this program; if not, you can access it online at |
| * http://www.gnu.org/licenses/gpl-2.0.html. |
| * |
| * SPDX-License-Identifier: GPL-2.0 |
| * |
| */ |
| |
| |
| |
| #include <linux/dma-buf.h> |
| #ifdef CONFIG_COMPAT |
| #include <linux/compat.h> |
| #endif |
| #include <mali_kbase.h> |
| #include <linux/random.h> |
| #include <linux/version.h> |
| #include <linux/ratelimit.h> |
| |
| #include <mali_kbase_jm.h> |
| #include <mali_kbase_hwaccess_jm.h> |
| #include <mali_kbase_tracepoints.h> |
| |
| #include "mali_kbase_dma_fence.h" |
| |
/* Debug trace helper: emits "<calling function>:" followed by the formatted
 * message through dev_dbg() on the device reached via kctx->kbdev->dev.
 * The context argument is parenthesised so that any pointer expression
 * (not just a plain identifier) can be passed safely. */
#define beenthere(kctx, f, a...)  dev_dbg((kctx)->kbdev->dev, "%s:" f, __func__, ##a)
| |
| #if LINUX_VERSION_CODE < KERNEL_VERSION(3, 8, 0) |
| /* random32 was renamed to prandom_u32 in 3.8 */ |
| #define prandom_u32 random32 |
| #endif |
| |
/* Return whether katom will run on the GPU or not. Currently only soft jobs and
 * dependency-only atoms do not run on the GPU.
 *
 * The argument is parenthesised at every use so that any pointer expression
 * (e.g. "&array[i]" or "base + n") can be passed, not only a plain
 * identifier. Note that the argument is evaluated twice, so it must not have
 * side effects. */
#define IS_GPU_ATOM(katom) (!(((katom)->core_req & BASE_JD_REQ_SOFT_JOB) ||  \
			(((katom)->core_req & BASE_JD_REQ_ATOM_TYPE) ==      \
							BASE_JD_REQ_DEP)))
| /* |
| * This is the kernel side of the API. Only entry points are: |
| * - kbase_jd_submit(): Called from userspace to submit a single bag |
| * - kbase_jd_done(): Called from interrupt context to track the |
| * completion of a job. |
| * Callouts: |
| * - to the job manager (enqueue a job) |
| * - to the event subsystem (signals the completion/failure of bag/job-chains). |
| */ |
| |
| static void __user * |
| get_compat_pointer(struct kbase_context *kctx, const u64 p) |
| { |
| #ifdef CONFIG_COMPAT |
| if (kbase_ctx_flag(kctx, KCTX_COMPAT)) |
| return compat_ptr(p); |
| #endif |
| return u64_to_user_ptr(p); |
| } |
| |
| /* Runs an atom, either by handing to the JS or by immediately running it in the case of soft-jobs |
| * |
| * Returns whether the JS needs a reschedule. |
| * |
| * Note that the caller must also check the atom status and |
| * if it is KBASE_JD_ATOM_STATE_COMPLETED must call jd_done_nolock |
| */ |
| static int jd_run_atom(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| |
| KBASE_DEBUG_ASSERT(katom->status != KBASE_JD_ATOM_STATE_UNUSED); |
| |
| if ((katom->core_req & BASE_JD_REQ_ATOM_TYPE) == BASE_JD_REQ_DEP) { |
| /* Dependency only atom */ |
| katom->status = KBASE_JD_ATOM_STATE_COMPLETED; |
| return 0; |
| } else if (katom->core_req & BASE_JD_REQ_SOFT_JOB) { |
| /* Soft-job */ |
| if (katom->will_fail_event_code) { |
| kbase_finish_soft_job(katom); |
| katom->status = KBASE_JD_ATOM_STATE_COMPLETED; |
| return 0; |
| } |
| if (kbase_process_soft_job(katom) == 0) { |
| kbase_finish_soft_job(katom); |
| katom->status = KBASE_JD_ATOM_STATE_COMPLETED; |
| } |
| return 0; |
| } |
| |
| katom->status = KBASE_JD_ATOM_STATE_IN_JS; |
| /* Queue an action about whether we should try scheduling a context */ |
| return kbasep_js_add_job(kctx, katom); |
| } |
| |
#if defined(CONFIG_MALI_DMA_FENCE)
/*
 * Attempt to run @katom once one of its dependencies has been cleared.
 *
 * A GPU atom is always submitted, since the job scheduler may be able to
 * represent its remaining dependencies. Any other atom is only run when
 * neither dep[0] nor dep[1] still refers to an atom.
 *
 * This calls jd_done_nolock(), which requires kbase_jd_context.lock to be
 * held.
 */
void kbase_jd_dep_clear_locked(struct kbase_jd_atom *katom)
{
	struct kbase_device *kbdev;
	bool resched;

	KBASE_DEBUG_ASSERT(katom);
	kbdev = katom->kctx->kbdev;
	KBASE_DEBUG_ASSERT(kbdev);

	/* Non-GPU atoms must have had both dependencies resolved */
	if (!IS_GPU_ATOM(katom) &&
	    (kbase_jd_katom_dep_atom(&katom->dep[0]) ||
	     kbase_jd_katom_dep_atom(&katom->dep[1])))
		return;

	/* katom dep complete, attempt to run it */
	resched = jd_run_atom(katom);

	/* The atom may already have finished while being run */
	if (katom->status == KBASE_JD_ATOM_STATE_COMPLETED)
		resched |= jd_done_nolock(katom, NULL);

	if (resched)
		kbase_js_sched_all(kbdev);
}
#endif
| |
/*
 * Release external-resource related state of @katom.
 *
 * With CONFIG_MALI_DMA_FENCE this flushes the context's dma-fence workqueue
 * for atoms that did not finish with BASE_JD_EVENT_DONE, so that any queued
 * callbacks have run before the caller continues. Without that option the
 * function does nothing.
 */
void kbase_jd_free_external_resources(struct kbase_jd_atom *katom)
{
#ifdef CONFIG_MALI_DMA_FENCE
	/* Any successfully completed atom would have had all its callbacks
	 * completed before the atom was run, so there is nothing to flush.
	 */
	if (katom->event_code == BASE_JD_EVENT_DONE)
		return;

	flush_workqueue(katom->kctx->dma_fence.wq);
#endif /* CONFIG_MALI_DMA_FENCE */
}
| |
| static void kbase_jd_post_external_resources(struct kbase_jd_atom *katom) |
| { |
| KBASE_DEBUG_ASSERT(katom); |
| KBASE_DEBUG_ASSERT(katom->core_req & BASE_JD_REQ_EXTERNAL_RESOURCES); |
| |
| #ifdef CONFIG_MALI_DMA_FENCE |
| kbase_dma_fence_signal(katom); |
| #endif /* CONFIG_MALI_DMA_FENCE */ |
| |
| kbase_gpu_vm_lock(katom->kctx); |
| /* only roll back if extres is non-NULL */ |
| if (katom->extres) { |
| u32 res_no; |
| |
| res_no = katom->nr_extres; |
| while (res_no-- > 0) { |
| struct kbase_mem_phy_alloc *alloc = katom->extres[res_no].alloc; |
| struct kbase_va_region *reg; |
| |
| reg = kbase_region_tracker_find_region_base_address( |
| katom->kctx, |
| katom->extres[res_no].gpu_address); |
| kbase_unmap_external_resource(katom->kctx, reg, alloc); |
| } |
| kfree(katom->extres); |
| katom->extres = NULL; |
| } |
| kbase_gpu_vm_unlock(katom->kctx); |
| } |
| |
| /* |
| * Set up external resources needed by this job. |
| * |
| * jctx.lock must be held when this is called. |
| */ |
| |
| static int kbase_jd_pre_external_resources(struct kbase_jd_atom *katom, const struct base_jd_atom_v2 *user_atom) |
| { |
| int err_ret_val = -EINVAL; |
| u32 res_no; |
| #ifdef CONFIG_MALI_DMA_FENCE |
| struct kbase_dma_fence_resv_info info = { |
| .resv_objs = NULL, |
| .dma_fence_resv_count = 0, |
| .dma_fence_excl_bitmap = NULL |
| }; |
| #if defined(CONFIG_SYNC) || defined(CONFIG_SYNC_FILE) |
| /* |
| * When both dma-buf fence and Android native sync is enabled, we |
| * disable dma-buf fence for contexts that are using Android native |
| * fences. |
| */ |
| const bool implicit_sync = !kbase_ctx_flag(katom->kctx, |
| KCTX_NO_IMPLICIT_SYNC); |
| #else /* CONFIG_SYNC || CONFIG_SYNC_FILE*/ |
| const bool implicit_sync = true; |
| #endif /* CONFIG_SYNC || CONFIG_SYNC_FILE */ |
| #endif /* CONFIG_MALI_DMA_FENCE */ |
| struct base_external_resource *input_extres; |
| |
| KBASE_DEBUG_ASSERT(katom); |
| KBASE_DEBUG_ASSERT(katom->core_req & BASE_JD_REQ_EXTERNAL_RESOURCES); |
| |
| /* no resources encoded, early out */ |
| if (!katom->nr_extres) |
| return -EINVAL; |
| |
| katom->extres = kmalloc_array(katom->nr_extres, sizeof(*katom->extres), GFP_KERNEL); |
| if (!katom->extres) |
| return -ENOMEM; |
| |
| /* copy user buffer to the end of our real buffer. |
| * Make sure the struct sizes haven't changed in a way |
| * we don't support */ |
| BUILD_BUG_ON(sizeof(*input_extres) > sizeof(*katom->extres)); |
| input_extres = (struct base_external_resource *) |
| (((unsigned char *)katom->extres) + |
| (sizeof(*katom->extres) - sizeof(*input_extres)) * |
| katom->nr_extres); |
| |
| if (copy_from_user(input_extres, |
| get_compat_pointer(katom->kctx, user_atom->extres_list), |
| sizeof(*input_extres) * katom->nr_extres) != 0) { |
| err_ret_val = -EINVAL; |
| goto early_err_out; |
| } |
| |
| #ifdef CONFIG_MALI_DMA_FENCE |
| if (implicit_sync) { |
| info.resv_objs = kmalloc_array(katom->nr_extres, |
| sizeof(struct reservation_object *), |
| GFP_KERNEL); |
| if (!info.resv_objs) { |
| err_ret_val = -ENOMEM; |
| goto early_err_out; |
| } |
| |
| info.dma_fence_excl_bitmap = |
| kcalloc(BITS_TO_LONGS(katom->nr_extres), |
| sizeof(unsigned long), GFP_KERNEL); |
| if (!info.dma_fence_excl_bitmap) { |
| err_ret_val = -ENOMEM; |
| goto early_err_out; |
| } |
| } |
| #endif /* CONFIG_MALI_DMA_FENCE */ |
| |
| /* Take the processes mmap lock */ |
| down_read(¤t->mm->mmap_sem); |
| |
| /* need to keep the GPU VM locked while we set up UMM buffers */ |
| kbase_gpu_vm_lock(katom->kctx); |
| for (res_no = 0; res_no < katom->nr_extres; res_no++) { |
| struct base_external_resource *res = &input_extres[res_no]; |
| struct kbase_va_region *reg; |
| struct kbase_mem_phy_alloc *alloc; |
| #ifdef CONFIG_MALI_DMA_FENCE |
| bool exclusive; |
| exclusive = (res->ext_resource & BASE_EXT_RES_ACCESS_EXCLUSIVE) |
| ? true : false; |
| #endif |
| reg = kbase_region_tracker_find_region_enclosing_address( |
| katom->kctx, |
| res->ext_resource & ~BASE_EXT_RES_ACCESS_EXCLUSIVE); |
| /* did we find a matching region object? */ |
| if (kbase_is_region_invalid_or_free(reg)) { |
| /* roll back */ |
| goto failed_loop; |
| } |
| |
| if (!(katom->core_req & BASE_JD_REQ_SOFT_JOB) && |
| (reg->flags & KBASE_REG_PROTECTED)) { |
| katom->atom_flags |= KBASE_KATOM_FLAG_PROTECTED; |
| } |
| |
| alloc = kbase_map_external_resource(katom->kctx, reg, |
| current->mm); |
| if (!alloc) { |
| err_ret_val = -EINVAL; |
| goto failed_loop; |
| } |
| |
| #ifdef CONFIG_MALI_DMA_FENCE |
| if (implicit_sync && |
| reg->gpu_alloc->type == KBASE_MEM_TYPE_IMPORTED_UMM) { |
| struct reservation_object *resv; |
| |
| resv = reg->gpu_alloc->imported.umm.dma_buf->resv; |
| if (resv) |
| kbase_dma_fence_add_reservation(resv, &info, |
| exclusive); |
| } |
| #endif /* CONFIG_MALI_DMA_FENCE */ |
| |
| /* finish with updating out array with the data we found */ |
| /* NOTE: It is important that this is the last thing we do (or |
| * at least not before the first write) as we overwrite elements |
| * as we loop and could be overwriting ourself, so no writes |
| * until the last read for an element. |
| * */ |
| katom->extres[res_no].gpu_address = reg->start_pfn << PAGE_SHIFT; /* save the start_pfn (as an address, not pfn) to use fast lookup later */ |
| katom->extres[res_no].alloc = alloc; |
| } |
| /* successfully parsed the extres array */ |
| /* drop the vm lock now */ |
| kbase_gpu_vm_unlock(katom->kctx); |
| |
| /* Release the processes mmap lock */ |
| up_read(¤t->mm->mmap_sem); |
| |
| #ifdef CONFIG_MALI_DMA_FENCE |
| if (implicit_sync) { |
| if (info.dma_fence_resv_count) { |
| int ret; |
| |
| ret = kbase_dma_fence_wait(katom, &info); |
| if (ret < 0) |
| goto failed_dma_fence_setup; |
| } |
| |
| kfree(info.resv_objs); |
| kfree(info.dma_fence_excl_bitmap); |
| } |
| #endif /* CONFIG_MALI_DMA_FENCE */ |
| |
| /* all done OK */ |
| return 0; |
| |
| /* error handling section */ |
| |
| #ifdef CONFIG_MALI_DMA_FENCE |
| failed_dma_fence_setup: |
| /* Lock the processes mmap lock */ |
| down_read(¤t->mm->mmap_sem); |
| |
| /* lock before we unmap */ |
| kbase_gpu_vm_lock(katom->kctx); |
| #endif |
| |
| failed_loop: |
| /* undo the loop work */ |
| while (res_no-- > 0) { |
| struct kbase_mem_phy_alloc *alloc = katom->extres[res_no].alloc; |
| |
| kbase_unmap_external_resource(katom->kctx, NULL, alloc); |
| } |
| kbase_gpu_vm_unlock(katom->kctx); |
| |
| /* Release the processes mmap lock */ |
| up_read(¤t->mm->mmap_sem); |
| |
| early_err_out: |
| kfree(katom->extres); |
| katom->extres = NULL; |
| #ifdef CONFIG_MALI_DMA_FENCE |
| if (implicit_sync) { |
| kfree(info.resv_objs); |
| kfree(info.dma_fence_excl_bitmap); |
| } |
| #endif |
| return err_ret_val; |
| } |
| |
| static inline void jd_resolve_dep(struct list_head *out_list, |
| struct kbase_jd_atom *katom, |
| u8 d, bool ctx_is_dying) |
| { |
| u8 other_d = !d; |
| |
| while (!list_empty(&katom->dep_head[d])) { |
| struct kbase_jd_atom *dep_atom; |
| struct kbase_jd_atom *other_dep_atom; |
| u8 dep_type; |
| |
| dep_atom = list_entry(katom->dep_head[d].next, |
| struct kbase_jd_atom, dep_item[d]); |
| list_del(katom->dep_head[d].next); |
| |
| dep_type = kbase_jd_katom_dep_type(&dep_atom->dep[d]); |
| kbase_jd_katom_dep_clear(&dep_atom->dep[d]); |
| |
| if (katom->event_code != BASE_JD_EVENT_DONE && |
| (dep_type != BASE_JD_DEP_TYPE_ORDER)) { |
| #ifdef CONFIG_MALI_DMA_FENCE |
| kbase_dma_fence_cancel_callbacks(dep_atom); |
| #endif |
| |
| dep_atom->event_code = katom->event_code; |
| KBASE_DEBUG_ASSERT(dep_atom->status != |
| KBASE_JD_ATOM_STATE_UNUSED); |
| |
| dep_atom->will_fail_event_code = dep_atom->event_code; |
| } |
| other_dep_atom = (struct kbase_jd_atom *) |
| kbase_jd_katom_dep_atom(&dep_atom->dep[other_d]); |
| |
| if (!dep_atom->in_jd_list && (!other_dep_atom || |
| (IS_GPU_ATOM(dep_atom) && !ctx_is_dying && |
| !dep_atom->will_fail_event_code && |
| !other_dep_atom->will_fail_event_code))) { |
| bool dep_satisfied = true; |
| #ifdef CONFIG_MALI_DMA_FENCE |
| int dep_count; |
| |
| dep_count = kbase_fence_dep_count_read(dep_atom); |
| if (likely(dep_count == -1)) { |
| dep_satisfied = true; |
| } else { |
| /* |
| * There are either still active callbacks, or |
| * all fences for this @dep_atom has signaled, |
| * but the worker that will queue the atom has |
| * not yet run. |
| * |
| * Wait for the fences to signal and the fence |
| * worker to run and handle @dep_atom. If |
| * @dep_atom was completed due to error on |
| * @katom, then the fence worker will pick up |
| * the complete status and error code set on |
| * @dep_atom above. |
| */ |
| dep_satisfied = false; |
| } |
| #endif /* CONFIG_MALI_DMA_FENCE */ |
| |
| if (dep_satisfied) { |
| dep_atom->in_jd_list = true; |
| list_add_tail(&dep_atom->jd_item, out_list); |
| } |
| } |
| } |
| } |
| |
| KBASE_EXPORT_TEST_API(jd_resolve_dep); |
| |
| /** |
| * is_dep_valid - Validate that a dependency is valid for early dependency |
| * submission |
| * @katom: Dependency atom to validate |
| * |
| * A dependency is valid if any of the following are true : |
| * - It does not exist (a non-existent dependency does not block submission) |
| * - It is in the job scheduler |
| * - It has completed, does not have a failure event code, and has not been |
| * marked to fail in the future |
| * |
| * Return: true if valid, false otherwise |
| */ |
| static bool is_dep_valid(struct kbase_jd_atom *katom) |
| { |
| /* If there's no dependency then this is 'valid' from the perspective of |
| * early dependency submission */ |
| if (!katom) |
| return true; |
| |
| /* Dependency must have reached the job scheduler */ |
| if (katom->status < KBASE_JD_ATOM_STATE_IN_JS) |
| return false; |
| |
| /* If dependency has completed and has failed or will fail then it is |
| * not valid */ |
| if (katom->status >= KBASE_JD_ATOM_STATE_HW_COMPLETED && |
| (katom->event_code != BASE_JD_EVENT_DONE || |
| katom->will_fail_event_code)) |
| return false; |
| |
| return true; |
| } |
| |
| static void jd_try_submitting_deps(struct list_head *out_list, |
| struct kbase_jd_atom *node) |
| { |
| int i; |
| |
| for (i = 0; i < 2; i++) { |
| struct list_head *pos; |
| |
| list_for_each(pos, &node->dep_head[i]) { |
| struct kbase_jd_atom *dep_atom = list_entry(pos, |
| struct kbase_jd_atom, dep_item[i]); |
| |
| if (IS_GPU_ATOM(dep_atom) && !dep_atom->in_jd_list) { |
| /*Check if atom deps look sane*/ |
| bool dep0_valid = is_dep_valid( |
| dep_atom->dep[0].atom); |
| bool dep1_valid = is_dep_valid( |
| dep_atom->dep[1].atom); |
| bool dep_satisfied = true; |
| #ifdef CONFIG_MALI_DMA_FENCE |
| int dep_count; |
| |
| dep_count = kbase_fence_dep_count_read( |
| dep_atom); |
| if (likely(dep_count == -1)) { |
| dep_satisfied = true; |
| } else { |
| /* |
| * There are either still active callbacks, or |
| * all fences for this @dep_atom has signaled, |
| * but the worker that will queue the atom has |
| * not yet run. |
| * |
| * Wait for the fences to signal and the fence |
| * worker to run and handle @dep_atom. If |
| * @dep_atom was completed due to error on |
| * @katom, then the fence worker will pick up |
| * the complete status and error code set on |
| * @dep_atom above. |
| */ |
| dep_satisfied = false; |
| } |
| #endif /* CONFIG_MALI_DMA_FENCE */ |
| |
| if (dep0_valid && dep1_valid && dep_satisfied) { |
| dep_atom->in_jd_list = true; |
| list_add(&dep_atom->jd_item, out_list); |
| } |
| } |
| } |
| } |
| } |
| |
| /* |
| * Perform the necessary handling of an atom that has finished running |
| * on the GPU. |
| * |
| * Note that if this is a soft-job that has had kbase_prepare_soft_job called on it then the caller |
| * is responsible for calling kbase_finish_soft_job *before* calling this function. |
| * |
| * The caller must hold the kbase_jd_context.lock. |
| */ |
| bool jd_done_nolock(struct kbase_jd_atom *katom, |
| struct list_head *completed_jobs_ctx) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| struct kbase_device *kbdev = kctx->kbdev; |
| struct list_head completed_jobs; |
| struct list_head runnable_jobs; |
| bool need_to_try_schedule_context = false; |
| int i; |
| |
| INIT_LIST_HEAD(&completed_jobs); |
| INIT_LIST_HEAD(&runnable_jobs); |
| |
| KBASE_DEBUG_ASSERT(katom->status != KBASE_JD_ATOM_STATE_UNUSED); |
| |
| /* This is needed in case an atom is failed due to being invalid, this |
| * can happen *before* the jobs that the atom depends on have completed */ |
| for (i = 0; i < 2; i++) { |
| if (kbase_jd_katom_dep_atom(&katom->dep[i])) { |
| list_del(&katom->dep_item[i]); |
| kbase_jd_katom_dep_clear(&katom->dep[i]); |
| } |
| } |
| |
| /* With PRLAM-10817 or PRLAM-10959 the last tile of a fragment job being soft-stopped can fail with |
| * BASE_JD_EVENT_TILE_RANGE_FAULT. |
| * |
| * So here if the fragment job failed with TILE_RANGE_FAULT and it has been soft-stopped, then we promote the |
| * error code to BASE_JD_EVENT_DONE |
| */ |
| |
| if ((kbase_hw_has_issue(kbdev, BASE_HW_ISSUE_10817) || kbase_hw_has_issue(kbdev, BASE_HW_ISSUE_10959)) && |
| katom->event_code == BASE_JD_EVENT_TILE_RANGE_FAULT) { |
| if ((katom->core_req & BASE_JD_REQ_FS) && (katom->atom_flags & KBASE_KATOM_FLAG_BEEN_SOFT_STOPPPED)) { |
| /* Promote the failure to job done */ |
| katom->event_code = BASE_JD_EVENT_DONE; |
| katom->atom_flags = katom->atom_flags & (~KBASE_KATOM_FLAG_BEEN_SOFT_STOPPPED); |
| } |
| } |
| |
| katom->status = KBASE_JD_ATOM_STATE_COMPLETED; |
| list_add_tail(&katom->jd_item, &completed_jobs); |
| |
| while (!list_empty(&completed_jobs)) { |
| katom = list_entry(completed_jobs.prev, struct kbase_jd_atom, jd_item); |
| list_del(completed_jobs.prev); |
| KBASE_DEBUG_ASSERT(katom->status == KBASE_JD_ATOM_STATE_COMPLETED); |
| |
| for (i = 0; i < 2; i++) |
| jd_resolve_dep(&runnable_jobs, katom, i, |
| kbase_ctx_flag(kctx, KCTX_DYING)); |
| |
| if (katom->core_req & BASE_JD_REQ_EXTERNAL_RESOURCES) |
| kbase_jd_post_external_resources(katom); |
| |
| while (!list_empty(&runnable_jobs)) { |
| struct kbase_jd_atom *node; |
| |
| node = list_entry(runnable_jobs.next, |
| struct kbase_jd_atom, jd_item); |
| list_del(runnable_jobs.next); |
| node->in_jd_list = false; |
| |
| KBASE_DEBUG_ASSERT(node->status != KBASE_JD_ATOM_STATE_UNUSED); |
| |
| if (node->status != KBASE_JD_ATOM_STATE_COMPLETED && |
| !kbase_ctx_flag(kctx, KCTX_DYING)) { |
| need_to_try_schedule_context |= jd_run_atom(node); |
| } else { |
| node->event_code = katom->event_code; |
| |
| if (node->core_req & |
| BASE_JD_REQ_SOFT_JOB) { |
| WARN_ON(!list_empty(&node->queue)); |
| kbase_finish_soft_job(node); |
| } |
| node->status = KBASE_JD_ATOM_STATE_COMPLETED; |
| } |
| |
| if (node->status == KBASE_JD_ATOM_STATE_COMPLETED) { |
| list_add_tail(&node->jd_item, &completed_jobs); |
| } else if (node->status == KBASE_JD_ATOM_STATE_IN_JS && |
| !node->will_fail_event_code) { |
| /* Node successfully submitted, try submitting |
| * dependencies as they may now be representable |
| * in JS */ |
| jd_try_submitting_deps(&runnable_jobs, node); |
| } |
| } |
| |
| /* Register a completed job as a disjoint event when the GPU |
| * is in a disjoint state (ie. being reset). |
| */ |
| kbase_disjoint_event_potential(kctx->kbdev); |
| if (completed_jobs_ctx) |
| list_add_tail(&katom->jd_item, completed_jobs_ctx); |
| else |
| kbase_event_post(kctx, katom); |
| |
| /* Decrement and check the TOTAL number of jobs. This includes |
| * those not tracked by the scheduler: 'not ready to run' and |
| * 'dependency-only' jobs. */ |
| if (--kctx->jctx.job_nr == 0) |
| wake_up(&kctx->jctx.zero_jobs_wait); /* All events are safely queued now, and we can signal any waiter |
| * that we've got no more jobs (so we can be safely terminated) */ |
| } |
| |
| return need_to_try_schedule_context; |
| } |
| |
| KBASE_EXPORT_TEST_API(jd_done_nolock); |
| |
#ifdef CONFIG_GPU_TRACEPOINTS
/* Indices into core_req_strings[] */
enum {
	CORE_REQ_DEP_ONLY,
	CORE_REQ_SOFT,
	CORE_REQ_COMPUTE,
	CORE_REQ_FRAGMENT,
	CORE_REQ_VERTEX,
	CORE_REQ_TILER,
	CORE_REQ_FRAGMENT_VERTEX,
	CORE_REQ_FRAGMENT_VERTEX_TILER,
	CORE_REQ_FRAGMENT_TILER,
	CORE_REQ_VERTEX_TILER,
	CORE_REQ_UNKNOWN
};

/* Human readable job type names, used for the gpu_job_enqueue tracepoint */
static const char * const core_req_strings[] = {
	[CORE_REQ_DEP_ONLY] = "Dependency Only Job",
	[CORE_REQ_SOFT] = "Soft Job",
	[CORE_REQ_COMPUTE] = "Compute Shader Job",
	[CORE_REQ_FRAGMENT] = "Fragment Shader Job",
	[CORE_REQ_VERTEX] = "Vertex/Geometry Shader Job",
	[CORE_REQ_TILER] = "Tiler Job",
	[CORE_REQ_FRAGMENT_VERTEX] =
		"Fragment Shader + Vertex/Geometry Shader Job",
	[CORE_REQ_FRAGMENT_VERTEX_TILER] =
		"Fragment Shader + Vertex/Geometry Shader Job + Tiler Job",
	[CORE_REQ_FRAGMENT_TILER] = "Fragment Shader + Tiler Job",
	[CORE_REQ_VERTEX_TILER] = "Vertex/Geometry Shader Job + Tiler Job",
	[CORE_REQ_UNKNOWN] = "Unknown Job"
};

/*
 * Map an atom's core requirements to a descriptive job type string.
 *
 * The soft-job bit is checked first, then the compute-only bit; otherwise
 * the combination of the FS, CS and T bits selects the string.
 */
static const char *kbasep_map_core_reqs_to_string(base_jd_core_req core_req)
{
	int idx;

	if (core_req & BASE_JD_REQ_SOFT_JOB)
		return core_req_strings[CORE_REQ_SOFT];
	if (core_req & BASE_JD_REQ_ONLY_COMPUTE)
		return core_req_strings[CORE_REQ_COMPUTE];

	switch (core_req & (BASE_JD_REQ_FS | BASE_JD_REQ_CS | BASE_JD_REQ_T)) {
	case BASE_JD_REQ_DEP:
		idx = CORE_REQ_DEP_ONLY;
		break;
	case BASE_JD_REQ_FS:
		idx = CORE_REQ_FRAGMENT;
		break;
	case BASE_JD_REQ_CS:
		idx = CORE_REQ_VERTEX;
		break;
	case BASE_JD_REQ_T:
		idx = CORE_REQ_TILER;
		break;
	case (BASE_JD_REQ_FS | BASE_JD_REQ_CS):
		idx = CORE_REQ_FRAGMENT_VERTEX;
		break;
	case (BASE_JD_REQ_FS | BASE_JD_REQ_T):
		idx = CORE_REQ_FRAGMENT_TILER;
		break;
	case (BASE_JD_REQ_CS | BASE_JD_REQ_T):
		idx = CORE_REQ_VERTEX_TILER;
		break;
	case (BASE_JD_REQ_FS | BASE_JD_REQ_CS | BASE_JD_REQ_T):
		idx = CORE_REQ_FRAGMENT_VERTEX_TILER;
		break;
	default:
		idx = CORE_REQ_UNKNOWN;
		break;
	}

	return core_req_strings[idx];
}
#endif
| |
| bool jd_submit_atom(struct kbase_context *kctx, const struct base_jd_atom_v2 *user_atom, struct kbase_jd_atom *katom) |
| { |
| struct kbase_device *kbdev = kctx->kbdev; |
| struct kbase_jd_context *jctx = &kctx->jctx; |
| int queued = 0; |
| int i; |
| int sched_prio; |
| bool ret; |
| bool will_fail = false; |
| |
| /* Update the TOTAL number of jobs. This includes those not tracked by |
| * the scheduler: 'not ready to run' and 'dependency-only' jobs. */ |
| jctx->job_nr++; |
| |
| #if LINUX_VERSION_CODE < KERNEL_VERSION(4, 10, 0) |
| katom->start_timestamp.tv64 = 0; |
| #else |
| katom->start_timestamp = 0; |
| #endif |
| katom->udata = user_atom->udata; |
| katom->kctx = kctx; |
| katom->nr_extres = user_atom->nr_extres; |
| katom->extres = NULL; |
| katom->device_nr = user_atom->device_nr; |
| katom->jc = user_atom->jc; |
| katom->core_req = user_atom->core_req; |
| katom->jobslot = user_atom->jobslot; |
| katom->atom_flags = 0; |
| katom->retry_count = 0; |
| katom->need_cache_flush_cores_retained = 0; |
| katom->pre_dep = NULL; |
| katom->post_dep = NULL; |
| katom->x_pre_dep = NULL; |
| katom->x_post_dep = NULL; |
| katom->will_fail_event_code = BASE_JD_EVENT_NOT_STARTED; |
| katom->softjob_data = NULL; |
| |
| /* Implicitly sets katom->protected_state.enter as well. */ |
| katom->protected_state.exit = KBASE_ATOM_EXIT_PROTECTED_CHECK; |
| |
| katom->age = kctx->age_count++; |
| |
| INIT_LIST_HEAD(&katom->queue); |
| INIT_LIST_HEAD(&katom->jd_item); |
| #ifdef CONFIG_MALI_DMA_FENCE |
| kbase_fence_dep_count_set(katom, -1); |
| #endif |
| |
| /* Don't do anything if there is a mess up with dependencies. |
| This is done in a separate cycle to check both the dependencies at ones, otherwise |
| it will be extra complexity to deal with 1st dependency ( just added to the list ) |
| if only the 2nd one has invalid config. |
| */ |
| for (i = 0; i < 2; i++) { |
| int dep_atom_number = user_atom->pre_dep[i].atom_id; |
| base_jd_dep_type dep_atom_type = user_atom->pre_dep[i].dependency_type; |
| |
| if (dep_atom_number) { |
| if (dep_atom_type != BASE_JD_DEP_TYPE_ORDER && |
| dep_atom_type != BASE_JD_DEP_TYPE_DATA) { |
| katom->event_code = BASE_JD_EVENT_JOB_CONFIG_FAULT; |
| katom->status = KBASE_JD_ATOM_STATE_COMPLETED; |
| |
| /* Wrong dependency setup. Atom will be sent |
| * back to user space. Do not record any |
| * dependencies. */ |
| KBASE_TLSTREAM_TL_NEW_ATOM( |
| kbdev, |
| katom, |
| kbase_jd_atom_id(kctx, katom)); |
| KBASE_TLSTREAM_TL_RET_ATOM_CTX( |
| kbdev, |
| katom, kctx); |
| KBASE_TLSTREAM_TL_ATTRIB_ATOM_STATE( |
| kbdev, |
| katom, |
| TL_ATOM_STATE_IDLE); |
| |
| ret = jd_done_nolock(katom, NULL); |
| goto out; |
| } |
| } |
| } |
| |
| /* Add dependencies */ |
| for (i = 0; i < 2; i++) { |
| int dep_atom_number = user_atom->pre_dep[i].atom_id; |
| base_jd_dep_type dep_atom_type; |
| struct kbase_jd_atom *dep_atom = &jctx->atoms[dep_atom_number]; |
| |
| dep_atom_type = user_atom->pre_dep[i].dependency_type; |
| kbase_jd_katom_dep_clear(&katom->dep[i]); |
| |
| if (!dep_atom_number) |
| continue; |
| |
| if (dep_atom->status == KBASE_JD_ATOM_STATE_UNUSED || |
| dep_atom->status == KBASE_JD_ATOM_STATE_COMPLETED) { |
| |
| if (dep_atom->event_code == BASE_JD_EVENT_DONE) |
| continue; |
| /* don't stop this atom if it has an order dependency |
| * only to the failed one, try to submit it through |
| * the normal path |
| */ |
| if (dep_atom_type == BASE_JD_DEP_TYPE_ORDER && |
| dep_atom->event_code > BASE_JD_EVENT_ACTIVE) { |
| continue; |
| } |
| |
| /* Atom has completed, propagate the error code if any */ |
| katom->event_code = dep_atom->event_code; |
| katom->status = KBASE_JD_ATOM_STATE_QUEUED; |
| |
| /* This atom will be sent back to user space. |
| * Do not record any dependencies. |
| */ |
| KBASE_TLSTREAM_TL_NEW_ATOM( |
| kbdev, |
| katom, |
| kbase_jd_atom_id(kctx, katom)); |
| KBASE_TLSTREAM_TL_RET_ATOM_CTX(kbdev, katom, kctx); |
| KBASE_TLSTREAM_TL_ATTRIB_ATOM_STATE(kbdev, katom, |
| TL_ATOM_STATE_IDLE); |
| |
| will_fail = true; |
| |
| } else { |
| /* Atom is in progress, add this atom to the list */ |
| list_add_tail(&katom->dep_item[i], &dep_atom->dep_head[i]); |
| kbase_jd_katom_dep_set(&katom->dep[i], dep_atom, dep_atom_type); |
| queued = 1; |
| } |
| } |
| |
| if (will_fail) { |
| if (!queued) { |
| if (katom->core_req & BASE_JD_REQ_SOFT_JOB) { |
| /* This softjob has failed due to a previous |
| * dependency, however we should still run the |
| * prepare & finish functions |
| */ |
| int err = kbase_prepare_soft_job(katom); |
| |
| if (err >= 0) |
| kbase_finish_soft_job(katom); |
| } |
| |
| ret = jd_done_nolock(katom, NULL); |
| |
| goto out; |
| } else { |
| |
| if (katom->core_req & BASE_JD_REQ_SOFT_JOB) { |
| /* This softjob has failed due to a previous |
| * dependency, however we should still run the |
| * prepare & finish functions |
| */ |
| if (kbase_prepare_soft_job(katom) != 0) { |
| katom->event_code = |
| BASE_JD_EVENT_JOB_INVALID; |
| ret = jd_done_nolock(katom, NULL); |
| goto out; |
| } |
| } |
| |
| katom->will_fail_event_code = katom->event_code; |
| ret = false; |
| |
| goto out; |
| } |
| } else { |
| /* These must occur after the above loop to ensure that an atom |
| * that depends on a previous atom with the same number behaves |
| * as expected */ |
| katom->event_code = BASE_JD_EVENT_DONE; |
| katom->status = KBASE_JD_ATOM_STATE_QUEUED; |
| } |
| |
| /* For invalid priority, be most lenient and choose the default */ |
| sched_prio = kbasep_js_atom_prio_to_sched_prio(user_atom->prio); |
| if (sched_prio == KBASE_JS_ATOM_SCHED_PRIO_INVALID) |
| sched_prio = KBASE_JS_ATOM_SCHED_PRIO_DEFAULT; |
| katom->sched_priority = sched_prio; |
| |
| /* Create a new atom. */ |
| KBASE_TLSTREAM_TL_NEW_ATOM( |
| kbdev, |
| katom, |
| kbase_jd_atom_id(kctx, katom)); |
| KBASE_TLSTREAM_TL_ATTRIB_ATOM_STATE(kbdev, katom, TL_ATOM_STATE_IDLE); |
| KBASE_TLSTREAM_TL_ATTRIB_ATOM_PRIORITY(kbdev, katom, katom->sched_priority); |
| KBASE_TLSTREAM_TL_RET_ATOM_CTX(kbdev, katom, kctx); |
| |
| /* Reject atoms with job chain = NULL, as these cause issues with soft-stop */ |
| if (!katom->jc && (katom->core_req & BASE_JD_REQ_ATOM_TYPE) != BASE_JD_REQ_DEP) { |
| dev_warn(kctx->kbdev->dev, "Rejecting atom with jc = NULL"); |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| ret = jd_done_nolock(katom, NULL); |
| goto out; |
| } |
| |
| /* Reject atoms with an invalid device_nr */ |
| if ((katom->core_req & BASE_JD_REQ_SPECIFIC_COHERENT_GROUP) && |
| (katom->device_nr >= kctx->kbdev->gpu_props.num_core_groups)) { |
| dev_warn(kctx->kbdev->dev, |
| "Rejecting atom with invalid device_nr %d", |
| katom->device_nr); |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| ret = jd_done_nolock(katom, NULL); |
| goto out; |
| } |
| |
| /* Reject atoms with invalid core requirements */ |
| if ((katom->core_req & BASE_JD_REQ_EXTERNAL_RESOURCES) && |
| (katom->core_req & BASE_JD_REQ_EVENT_COALESCE)) { |
| dev_warn(kctx->kbdev->dev, |
| "Rejecting atom with invalid core requirements"); |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| katom->core_req &= ~BASE_JD_REQ_EVENT_COALESCE; |
| ret = jd_done_nolock(katom, NULL); |
| goto out; |
| } |
| |
| /* Reject soft-job atom of certain types from accessing external resources */ |
| if ((katom->core_req & BASE_JD_REQ_EXTERNAL_RESOURCES) && |
| (((katom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) == BASE_JD_REQ_SOFT_FENCE_WAIT) || |
| ((katom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) == BASE_JD_REQ_SOFT_JIT_ALLOC) || |
| ((katom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) == BASE_JD_REQ_SOFT_JIT_FREE))) { |
| dev_warn(kctx->kbdev->dev, |
| "Rejecting soft-job atom accessing external resources"); |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| ret = jd_done_nolock(katom, NULL); |
| goto out; |
| } |
| |
| if (katom->core_req & BASE_JD_REQ_EXTERNAL_RESOURCES) { |
| /* handle what we need to do to access the external resources */ |
| if (kbase_jd_pre_external_resources(katom, user_atom) != 0) { |
| /* setup failed (no access, bad resource, unknown resource types, etc.) */ |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| ret = jd_done_nolock(katom, NULL); |
| goto out; |
| } |
| } |
| |
| /* Validate the atom. Function will return error if the atom is |
| * malformed. |
| * |
| * Soft-jobs never enter the job scheduler but have their own initialize method. |
| * |
| * If either fail then we immediately complete the atom with an error. |
| */ |
| if ((katom->core_req & BASE_JD_REQ_SOFT_JOB) == 0) { |
| if (!kbase_js_is_atom_valid(kctx->kbdev, katom)) { |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| ret = jd_done_nolock(katom, NULL); |
| goto out; |
| } |
| } else { |
| /* Soft-job */ |
| if (kbase_prepare_soft_job(katom) != 0) { |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| ret = jd_done_nolock(katom, NULL); |
| goto out; |
| } |
| } |
| |
| #ifdef CONFIG_GPU_TRACEPOINTS |
| katom->work_id = atomic_inc_return(&jctx->work_id); |
| trace_gpu_job_enqueue(kctx->id, katom->work_id, |
| kbasep_map_core_reqs_to_string(katom->core_req)); |
| #endif |
| |
| if (queued && !IS_GPU_ATOM(katom)) { |
| ret = false; |
| goto out; |
| } |
| |
| #ifdef CONFIG_MALI_DMA_FENCE |
| if (kbase_fence_dep_count_read(katom) != -1) { |
| ret = false; |
| goto out; |
| } |
| #endif /* CONFIG_MALI_DMA_FENCE */ |
| |
| if (katom->core_req & BASE_JD_REQ_SOFT_JOB) { |
| if (kbase_process_soft_job(katom) == 0) { |
| kbase_finish_soft_job(katom); |
| ret = jd_done_nolock(katom, NULL); |
| goto out; |
| } |
| |
| ret = false; |
| } else if ((katom->core_req & BASE_JD_REQ_ATOM_TYPE) != BASE_JD_REQ_DEP) { |
| katom->status = KBASE_JD_ATOM_STATE_IN_JS; |
| ret = kbasep_js_add_job(kctx, katom); |
| /* If job was cancelled then resolve immediately */ |
| if (katom->event_code == BASE_JD_EVENT_JOB_CANCELLED) |
| ret = jd_done_nolock(katom, NULL); |
| } else { |
| /* This is a pure dependency. Resolve it immediately */ |
| ret = jd_done_nolock(katom, NULL); |
| } |
| |
| out: |
| return ret; |
| } |
| |
| int kbase_jd_submit(struct kbase_context *kctx, |
| void __user *user_addr, u32 nr_atoms, u32 stride, |
| bool uk6_atom) |
| { |
| struct kbase_jd_context *jctx = &kctx->jctx; |
| int err = 0; |
| int i; |
| bool need_to_try_schedule_context = false; |
| struct kbase_device *kbdev; |
| u32 latest_flush; |
| |
| /* |
| * kbase_jd_submit isn't expected to fail and so all errors with the |
| * jobs are reported by immediately failing them (through event system) |
| */ |
| kbdev = kctx->kbdev; |
| |
| beenthere(kctx, "%s", "Enter"); |
| |
| if (kbase_ctx_flag(kctx, KCTX_SUBMIT_DISABLED)) { |
| dev_err(kbdev->dev, "Attempt to submit to a context that has SUBMIT_DISABLED set on it"); |
| return -EINVAL; |
| } |
| |
| if (stride != sizeof(base_jd_atom_v2)) { |
| dev_err(kbdev->dev, "Stride passed to job_submit doesn't match kernel"); |
| return -EINVAL; |
| } |
| |
| /* All atoms submitted in this call have the same flush ID */ |
| latest_flush = kbase_backend_get_current_flush_id(kbdev); |
| |
| for (i = 0; i < nr_atoms; i++) { |
| struct base_jd_atom_v2 user_atom; |
| struct kbase_jd_atom *katom; |
| |
| if (copy_from_user(&user_atom, user_addr, |
| sizeof(user_atom)) != 0) { |
| err = -EINVAL; |
| break; |
| } |
| |
| user_addr = (void __user *)((uintptr_t) user_addr + stride); |
| |
| mutex_lock(&jctx->lock); |
| #ifndef compiletime_assert |
| #define compiletime_assert_defined |
| #define compiletime_assert(x, msg) do { switch (0) { case 0: case (x):; } } \ |
| while (false) |
| #endif |
| compiletime_assert((1 << (8*sizeof(user_atom.atom_number))) == |
| BASE_JD_ATOM_COUNT, |
| "BASE_JD_ATOM_COUNT and base_atom_id type out of sync"); |
| compiletime_assert(sizeof(user_atom.pre_dep[0].atom_id) == |
| sizeof(user_atom.atom_number), |
| "BASE_JD_ATOM_COUNT and base_atom_id type out of sync"); |
| #ifdef compiletime_assert_defined |
| #undef compiletime_assert |
| #undef compiletime_assert_defined |
| #endif |
| katom = &jctx->atoms[user_atom.atom_number]; |
| |
| /* Record the flush ID for the cache flush optimisation */ |
| katom->flush_id = latest_flush; |
| |
| while (katom->status != KBASE_JD_ATOM_STATE_UNUSED) { |
| /* Atom number is already in use, wait for the atom to |
| * complete |
| */ |
| mutex_unlock(&jctx->lock); |
| |
| /* This thread will wait for the atom to complete. Due |
| * to thread scheduling we are not sure that the other |
| * thread that owns the atom will also schedule the |
| * context, so we force the scheduler to be active and |
| * hence eventually schedule this context at some point |
| * later. |
| */ |
| kbase_js_sched_all(kbdev); |
| |
| if (wait_event_killable(katom->completed, |
| katom->status == |
| KBASE_JD_ATOM_STATE_UNUSED) != 0) { |
| /* We're being killed so the result code |
| * doesn't really matter |
| */ |
| return 0; |
| } |
| mutex_lock(&jctx->lock); |
| } |
| |
| need_to_try_schedule_context |= |
| jd_submit_atom(kctx, &user_atom, katom); |
| |
| /* Register a completed job as a disjoint event when the GPU is in a disjoint state |
| * (ie. being reset). |
| */ |
| kbase_disjoint_event_potential(kbdev); |
| |
| mutex_unlock(&jctx->lock); |
| } |
| |
| if (need_to_try_schedule_context) |
| kbase_js_sched_all(kbdev); |
| |
| return err; |
| } |
| |
| KBASE_EXPORT_TEST_API(kbase_jd_submit); |
| |
| void kbase_jd_done_worker(struct work_struct *data) |
| { |
| struct kbase_jd_atom *katom = container_of(data, struct kbase_jd_atom, work); |
| struct kbase_jd_context *jctx; |
| struct kbase_context *kctx; |
| struct kbasep_js_kctx_info *js_kctx_info; |
| struct kbase_device *kbdev; |
| struct kbasep_js_device_data *js_devdata; |
| u64 cache_jc = katom->jc; |
| struct kbasep_js_atom_retained_state katom_retained_state; |
| bool context_idle; |
| base_jd_core_req core_req = katom->core_req; |
| |
| /* Soft jobs should never reach this function */ |
| KBASE_DEBUG_ASSERT((katom->core_req & BASE_JD_REQ_SOFT_JOB) == 0); |
| |
| kctx = katom->kctx; |
| jctx = &kctx->jctx; |
| kbdev = kctx->kbdev; |
| js_kctx_info = &kctx->jctx.sched_info; |
| js_devdata = &kbdev->js_data; |
| |
| KBASE_TRACE_ADD(kbdev, JD_DONE_WORKER, kctx, katom, katom->jc, 0); |
| |
| kbase_backend_complete_wq(kbdev, katom); |
| |
| /* |
| * Begin transaction on JD context and JS context |
| */ |
| mutex_lock(&jctx->lock); |
| KBASE_TLSTREAM_TL_ATTRIB_ATOM_STATE(kbdev, katom, TL_ATOM_STATE_DONE); |
| mutex_lock(&js_devdata->queue_mutex); |
| mutex_lock(&js_kctx_info->ctx.jsctx_mutex); |
| |
| /* This worker only gets called on contexts that are scheduled *in*. This is |
| * because it only happens in response to an IRQ from a job that was |
| * running. |
| */ |
| KBASE_DEBUG_ASSERT(kbase_ctx_flag(kctx, KCTX_SCHEDULED)); |
| |
| if (katom->event_code == BASE_JD_EVENT_STOPPED) { |
| /* Atom has been promoted to stopped */ |
| unsigned long flags; |
| |
| mutex_unlock(&js_kctx_info->ctx.jsctx_mutex); |
| mutex_unlock(&js_devdata->queue_mutex); |
| |
| spin_lock_irqsave(&kbdev->hwaccess_lock, flags); |
| |
| katom->status = KBASE_JD_ATOM_STATE_IN_JS; |
| kbase_js_unpull(kctx, katom); |
| |
| spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags); |
| mutex_unlock(&jctx->lock); |
| |
| return; |
| } |
| |
| if ((katom->event_code != BASE_JD_EVENT_DONE) && |
| (!kbase_ctx_flag(katom->kctx, KCTX_DYING))) |
| dev_err(kbdev->dev, |
| "t6xx: GPU fault 0x%02lx from job slot %d\n", |
| (unsigned long)katom->event_code, |
| katom->slot_nr); |
| |
| if (kbase_hw_has_issue(kbdev, BASE_HW_ISSUE_8316)) |
| kbase_as_poking_timer_release_atom(kbdev, kctx, katom); |
| |
| /* Retain state before the katom disappears */ |
| kbasep_js_atom_retained_state_copy(&katom_retained_state, katom); |
| |
| context_idle = kbase_js_complete_atom_wq(kctx, katom); |
| |
| KBASE_DEBUG_ASSERT(kbasep_js_has_atom_finished(&katom_retained_state)); |
| |
| kbasep_js_remove_job(kbdev, kctx, katom); |
| mutex_unlock(&js_kctx_info->ctx.jsctx_mutex); |
| mutex_unlock(&js_devdata->queue_mutex); |
| katom->atom_flags &= ~KBASE_KATOM_FLAG_HOLDING_CTX_REF; |
| /* jd_done_nolock() requires the jsctx_mutex lock to be dropped */ |
| jd_done_nolock(katom, &kctx->completed_jobs); |
| |
| /* katom may have been freed now, do not use! */ |
| |
| if (context_idle) { |
| unsigned long flags; |
| |
| context_idle = false; |
| mutex_lock(&js_devdata->queue_mutex); |
| spin_lock_irqsave(&kbdev->hwaccess_lock, flags); |
| |
| /* If kbase_sched() has scheduled this context back in then |
| * KCTX_ACTIVE will have been set after we marked it as |
| * inactive, and another pm reference will have been taken, so |
| * drop our reference. But do not call kbase_jm_idle_ctx(), as |
| * the context is active and fast-starting is allowed. |
| * |
| * If an atom has been fast-started then kctx->atoms_pulled will |
| * be non-zero but KCTX_ACTIVE will still be false (as the |
| * previous pm reference has been inherited). Do NOT drop our |
| * reference, as it has been re-used, and leave the context as |
| * active. |
| * |
| * If no new atoms have been started then KCTX_ACTIVE will still |
| * be false and atoms_pulled will be zero, so drop the reference |
| * and call kbase_jm_idle_ctx(). |
| * |
| * As the checks are done under both the queue_mutex and |
| * hwaccess_lock is should be impossible for this to race |
| * with the scheduler code. |
| */ |
| if (kbase_ctx_flag(kctx, KCTX_ACTIVE) || |
| !atomic_read(&kctx->atoms_pulled)) { |
| /* Calling kbase_jm_idle_ctx() here will ensure that |
| * atoms are not fast-started when we drop the |
| * hwaccess_lock. This is not performed if |
| * KCTX_ACTIVE is set as in that case another pm |
| * reference has been taken and a fast-start would be |
| * valid. |
| */ |
| if (!kbase_ctx_flag(kctx, KCTX_ACTIVE)) |
| kbase_jm_idle_ctx(kbdev, kctx); |
| context_idle = true; |
| } else { |
| kbase_ctx_flag_set(kctx, KCTX_ACTIVE); |
| } |
| spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags); |
| mutex_unlock(&js_devdata->queue_mutex); |
| } |
| |
| /* |
| * Transaction complete |
| */ |
| mutex_unlock(&jctx->lock); |
| |
| /* Job is now no longer running, so can now safely release the context |
| * reference, and handle any actions that were logged against the atom's retained state */ |
| |
| kbasep_js_runpool_release_ctx_and_katom_retained_state(kbdev, kctx, &katom_retained_state); |
| |
| kbase_js_sched_all(kbdev); |
| |
| if (!atomic_dec_return(&kctx->work_count)) { |
| /* If worker now idle then post all events that jd_done_nolock() |
| * has queued */ |
| mutex_lock(&jctx->lock); |
| while (!list_empty(&kctx->completed_jobs)) { |
| struct kbase_jd_atom *atom = list_entry( |
| kctx->completed_jobs.next, |
| struct kbase_jd_atom, jd_item); |
| list_del(kctx->completed_jobs.next); |
| |
| kbase_event_post(kctx, atom); |
| } |
| mutex_unlock(&jctx->lock); |
| } |
| |
| kbase_backend_complete_wq_post_sched(kbdev, core_req); |
| |
| if (context_idle) |
| kbase_pm_context_idle(kbdev); |
| |
| KBASE_TRACE_ADD(kbdev, JD_DONE_WORKER_END, kctx, NULL, cache_jc, 0); |
| } |
| |
| /** |
| * jd_cancel_worker - Work queue job cancel function. |
| * @data: a &struct work_struct |
| * |
| * Only called as part of 'Zapping' a context (which occurs on termination). |
| * Operates serially with the kbase_jd_done_worker() on the work queue. |
| * |
| * This can only be called on contexts that aren't scheduled. |
| * |
| * We don't need to release most of the resources that would occur on |
| * kbase_jd_done() or kbase_jd_done_worker(), because the atoms here must not be |
| * running (by virtue of only being called on contexts that aren't |
| * scheduled). |
| */ |
| static void jd_cancel_worker(struct work_struct *data) |
| { |
| struct kbase_jd_atom *katom = container_of(data, struct kbase_jd_atom, work); |
| struct kbase_jd_context *jctx; |
| struct kbase_context *kctx; |
| struct kbasep_js_kctx_info *js_kctx_info; |
| bool need_to_try_schedule_context; |
| bool attr_state_changed; |
| struct kbase_device *kbdev; |
| |
| /* Soft jobs should never reach this function */ |
| KBASE_DEBUG_ASSERT((katom->core_req & BASE_JD_REQ_SOFT_JOB) == 0); |
| |
| kctx = katom->kctx; |
| kbdev = kctx->kbdev; |
| jctx = &kctx->jctx; |
| js_kctx_info = &kctx->jctx.sched_info; |
| |
| KBASE_TRACE_ADD(kbdev, JD_CANCEL_WORKER, kctx, katom, katom->jc, 0); |
| |
| /* This only gets called on contexts that are scheduled out. Hence, we must |
| * make sure we don't de-ref the number of running jobs (there aren't |
| * any), nor must we try to schedule out the context (it's already |
| * scheduled out). |
| */ |
| KBASE_DEBUG_ASSERT(!kbase_ctx_flag(kctx, KCTX_SCHEDULED)); |
| |
| /* Scheduler: Remove the job from the system */ |
| mutex_lock(&js_kctx_info->ctx.jsctx_mutex); |
| attr_state_changed = kbasep_js_remove_cancelled_job(kbdev, kctx, katom); |
| mutex_unlock(&js_kctx_info->ctx.jsctx_mutex); |
| |
| mutex_lock(&jctx->lock); |
| |
| need_to_try_schedule_context = jd_done_nolock(katom, NULL); |
| /* Because we're zapping, we're not adding any more jobs to this ctx, so no need to |
| * schedule the context. There's also no need for the jsctx_mutex to have been taken |
| * around this too. */ |
| KBASE_DEBUG_ASSERT(!need_to_try_schedule_context); |
| |
| /* katom may have been freed now, do not use! */ |
| mutex_unlock(&jctx->lock); |
| |
| if (attr_state_changed) |
| kbase_js_sched_all(kbdev); |
| } |
| |
| /** |
| * kbase_jd_done - Complete a job that has been removed from the Hardware |
| * @katom: atom which has been completed |
| * @slot_nr: slot the atom was on |
| * @end_timestamp: completion time |
| * @done_code: completion code |
| * |
| * This must be used whenever a job has been removed from the Hardware, e.g.: |
| * An IRQ indicates that the job finished (for both error and 'done' codes), or |
| * the job was evicted from the JS_HEAD_NEXT registers during a Soft/Hard stop. |
| * |
| * Some work is carried out immediately, and the rest is deferred onto a |
| * workqueue |
| * |
| * Context: |
| * This can be called safely from atomic context. |
| * The caller must hold kbdev->hwaccess_lock |
| */ |
| void kbase_jd_done(struct kbase_jd_atom *katom, int slot_nr, |
| ktime_t *end_timestamp, kbasep_js_atom_done_code done_code) |
| { |
| struct kbase_context *kctx; |
| struct kbase_device *kbdev; |
| |
| KBASE_DEBUG_ASSERT(katom); |
| kctx = katom->kctx; |
| KBASE_DEBUG_ASSERT(kctx); |
| kbdev = kctx->kbdev; |
| KBASE_DEBUG_ASSERT(kbdev); |
| |
| if (done_code & KBASE_JS_ATOM_DONE_EVICTED_FROM_NEXT) |
| katom->event_code = BASE_JD_EVENT_REMOVED_FROM_NEXT; |
| |
| KBASE_TRACE_ADD(kbdev, JD_DONE, kctx, katom, katom->jc, 0); |
| |
| kbase_job_check_leave_disjoint(kbdev, katom); |
| |
| katom->slot_nr = slot_nr; |
| |
| atomic_inc(&kctx->work_count); |
| |
| #ifdef CONFIG_DEBUG_FS |
| /* a failed job happened and is waiting for dumping*/ |
| if (!katom->will_fail_event_code && |
| kbase_debug_job_fault_process(katom, katom->event_code)) |
| return; |
| #endif |
| |
| WARN_ON(work_pending(&katom->work)); |
| INIT_WORK(&katom->work, kbase_jd_done_worker); |
| queue_work(kctx->jctx.job_done_wq, &katom->work); |
| } |
| |
| KBASE_EXPORT_TEST_API(kbase_jd_done); |
| |
| void kbase_jd_cancel(struct kbase_device *kbdev, struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx; |
| |
| KBASE_DEBUG_ASSERT(NULL != kbdev); |
| KBASE_DEBUG_ASSERT(NULL != katom); |
| kctx = katom->kctx; |
| KBASE_DEBUG_ASSERT(NULL != kctx); |
| |
| KBASE_TRACE_ADD(kbdev, JD_CANCEL, kctx, katom, katom->jc, 0); |
| |
| /* This should only be done from a context that is not scheduled */ |
| KBASE_DEBUG_ASSERT(!kbase_ctx_flag(kctx, KCTX_SCHEDULED)); |
| |
| WARN_ON(work_pending(&katom->work)); |
| |
| katom->event_code = BASE_JD_EVENT_JOB_CANCELLED; |
| |
| INIT_WORK(&katom->work, jd_cancel_worker); |
| queue_work(kctx->jctx.job_done_wq, &katom->work); |
| } |
| |
| |
| void kbase_jd_zap_context(struct kbase_context *kctx) |
| { |
| struct kbase_jd_atom *katom; |
| struct list_head *entry, *tmp; |
| struct kbase_device *kbdev; |
| |
| KBASE_DEBUG_ASSERT(kctx); |
| |
| kbdev = kctx->kbdev; |
| |
| KBASE_TRACE_ADD(kbdev, JD_ZAP_CONTEXT, kctx, NULL, 0u, 0u); |
| |
| kbase_js_zap_context(kctx); |
| |
| mutex_lock(&kctx->jctx.lock); |
| |
| /* |
| * While holding the struct kbase_jd_context lock clean up jobs which are known to kbase but are |
| * queued outside the job scheduler. |
| */ |
| |
| del_timer_sync(&kctx->soft_job_timeout); |
| list_for_each_safe(entry, tmp, &kctx->waiting_soft_jobs) { |
| katom = list_entry(entry, struct kbase_jd_atom, queue); |
| kbase_cancel_soft_job(katom); |
| } |
| |
| |
| #ifdef CONFIG_MALI_DMA_FENCE |
| kbase_dma_fence_cancel_all_atoms(kctx); |
| #endif |
| |
| mutex_unlock(&kctx->jctx.lock); |
| |
| #ifdef CONFIG_MALI_DMA_FENCE |
| /* Flush dma-fence workqueue to ensure that any callbacks that may have |
| * been queued are done before continuing. |
| */ |
| flush_workqueue(kctx->dma_fence.wq); |
| #endif |
| |
| #ifdef CONFIG_DEBUG_FS |
| kbase_debug_job_fault_kctx_unblock(kctx); |
| #endif |
| |
| kbase_jm_wait_for_zero_jobs(kctx); |
| } |
| |
| KBASE_EXPORT_TEST_API(kbase_jd_zap_context); |
| |
| int kbase_jd_init(struct kbase_context *kctx) |
| { |
| int i; |
| int mali_err = 0; |
| |
| KBASE_DEBUG_ASSERT(kctx); |
| |
| kctx->jctx.job_done_wq = alloc_workqueue("mali_jd", |
| WQ_HIGHPRI | WQ_UNBOUND, 1); |
| if (NULL == kctx->jctx.job_done_wq) { |
| mali_err = -ENOMEM; |
| goto out1; |
| } |
| |
| for (i = 0; i < BASE_JD_ATOM_COUNT; i++) { |
| init_waitqueue_head(&kctx->jctx.atoms[i].completed); |
| |
| INIT_LIST_HEAD(&kctx->jctx.atoms[i].dep_head[0]); |
| INIT_LIST_HEAD(&kctx->jctx.atoms[i].dep_head[1]); |
| |
| /* Catch userspace attempting to use an atom which doesn't exist as a pre-dependency */ |
| kctx->jctx.atoms[i].event_code = BASE_JD_EVENT_JOB_INVALID; |
| kctx->jctx.atoms[i].status = KBASE_JD_ATOM_STATE_UNUSED; |
| |
| #if defined(CONFIG_MALI_DMA_FENCE) || defined(CONFIG_SYNC_FILE) |
| kctx->jctx.atoms[i].dma_fence.context = |
| dma_fence_context_alloc(1); |
| atomic_set(&kctx->jctx.atoms[i].dma_fence.seqno, 0); |
| INIT_LIST_HEAD(&kctx->jctx.atoms[i].dma_fence.callbacks); |
| #endif |
| } |
| |
| mutex_init(&kctx->jctx.lock); |
| |
| init_waitqueue_head(&kctx->jctx.zero_jobs_wait); |
| |
| spin_lock_init(&kctx->jctx.tb_lock); |
| |
| kctx->jctx.job_nr = 0; |
| INIT_LIST_HEAD(&kctx->completed_jobs); |
| atomic_set(&kctx->work_count, 0); |
| |
| return 0; |
| |
| out1: |
| return mali_err; |
| } |
| |
| KBASE_EXPORT_TEST_API(kbase_jd_init); |
| |
| void kbase_jd_exit(struct kbase_context *kctx) |
| { |
| KBASE_DEBUG_ASSERT(kctx); |
| |
| /* Work queue is emptied by this */ |
| destroy_workqueue(kctx->jctx.job_done_wq); |
| } |
| |
| KBASE_EXPORT_TEST_API(kbase_jd_exit); |