| // SPDX-License-Identifier: GPL-2.0 WITH Linux-syscall-note |
| /* |
| * |
| * (C) COPYRIGHT 2011-2022 ARM Limited. All rights reserved. |
| * |
| * This program is free software and is provided to you under the terms of the |
| * GNU General Public License version 2 as published by the Free Software |
| * Foundation, and any use by you of this program is subject to the terms |
| * of such GNU license. |
| * |
| * This program is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| * GNU General Public License for more details. |
| * |
| * You should have received a copy of the GNU General Public License |
| * along with this program; if not, you can access it online at |
| * http://www.gnu.org/licenses/gpl-2.0.html. |
| * |
| */ |
| |
| #include <mali_kbase.h> |
| |
| #include <linux/dma-buf.h> |
| #include <asm/cacheflush.h> |
| #if defined(CONFIG_SYNC) || defined(CONFIG_SYNC_FILE) |
| #include <mali_kbase_sync.h> |
| #endif |
| #include <linux/dma-mapping.h> |
| #include <uapi/gpu/arm/midgard/mali_base_kernel.h> |
| #include <mali_kbase_hwaccess_time.h> |
| #include <mali_kbase_kinstr_jm.h> |
| #include <mali_kbase_mem_linux.h> |
| #include <tl/mali_kbase_tracepoints.h> |
| #include <mali_linux_trace.h> |
| #include <linux/version.h> |
| #include <linux/ktime.h> |
| #include <linux/pfn.h> |
| #include <linux/sched.h> |
| #include <linux/kernel.h> |
| #include <linux/cache.h> |
| |
| #if !MALI_USE_CSF |
| /** |
| * DOC: This file implements the logic behind software only jobs that are |
| * executed within the driver rather than being handed over to the GPU. |
| */ |
| |
| static void kbasep_add_waiting_soft_job(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| unsigned long lflags; |
| |
| spin_lock_irqsave(&kctx->waiting_soft_jobs_lock, lflags); |
| list_add_tail(&katom->queue, &kctx->waiting_soft_jobs); |
| spin_unlock_irqrestore(&kctx->waiting_soft_jobs_lock, lflags); |
| } |
| |
| void kbasep_remove_waiting_soft_job(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| unsigned long lflags; |
| |
| spin_lock_irqsave(&kctx->waiting_soft_jobs_lock, lflags); |
| list_del(&katom->queue); |
| spin_unlock_irqrestore(&kctx->waiting_soft_jobs_lock, lflags); |
| } |
| |
| static void kbasep_add_waiting_with_timeout(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| |
| /* Record the start time of this atom so we could cancel it at |
| * the right time. |
| */ |
| katom->start_timestamp = ktime_get_raw(); |
| |
| /* Add the atom to the waiting list before the timer is |
| * (re)started to make sure that it gets processed. |
| */ |
| kbasep_add_waiting_soft_job(katom); |
| |
| /* Schedule timeout of this atom after a period if it is not active */ |
| if (!timer_pending(&kctx->soft_job_timeout)) { |
| int timeout_ms = atomic_read( |
| &kctx->kbdev->js_data.soft_job_timeout_ms); |
| mod_timer(&kctx->soft_job_timeout, |
| jiffies + msecs_to_jiffies(timeout_ms)); |
| } |
| } |
| |
| static int kbasep_read_soft_event_status( |
| struct kbase_context *kctx, u64 evt, unsigned char *status) |
| { |
| unsigned char *mapped_evt; |
| struct kbase_vmap_struct map; |
| |
| mapped_evt = kbase_vmap_prot(kctx, evt, sizeof(*mapped_evt), |
| KBASE_REG_CPU_RD, &map); |
| if (!mapped_evt) |
| return -EFAULT; |
| |
| *status = *mapped_evt; |
| |
| kbase_vunmap(kctx, &map); |
| |
| return 0; |
| } |
| |
| static int kbasep_write_soft_event_status( |
| struct kbase_context *kctx, u64 evt, unsigned char new_status) |
| { |
| unsigned char *mapped_evt; |
| struct kbase_vmap_struct map; |
| |
| if ((new_status != BASE_JD_SOFT_EVENT_SET) && |
| (new_status != BASE_JD_SOFT_EVENT_RESET)) |
| return -EINVAL; |
| |
| mapped_evt = kbase_vmap_prot(kctx, evt, sizeof(*mapped_evt), |
| KBASE_REG_CPU_WR, &map); |
| if (!mapped_evt) |
| return -EFAULT; |
| |
| *mapped_evt = new_status; |
| |
| kbase_vunmap(kctx, &map); |
| |
| return 0; |
| } |
| |
| static int kbase_dump_cpu_gpu_time(struct kbase_jd_atom *katom) |
| { |
| struct kbase_vmap_struct map; |
| void *user_result; |
| struct timespec64 ts; |
| struct base_dump_cpu_gpu_counters data; |
| u64 system_time = 0ULL; |
| u64 cycle_counter; |
| u64 jc = katom->jc; |
| struct kbase_context *kctx = katom->kctx; |
| int pm_active_err; |
| |
| memset(&data, 0, sizeof(data)); |
| |
| /* Take the PM active reference as late as possible - otherwise, it could |
| * delay suspend until we process the atom (which may be at the end of a |
| * long chain of dependencies |
| */ |
| #ifdef CONFIG_MALI_ARBITER_SUPPORT |
| atomic_inc(&kctx->kbdev->pm.gpu_users_waiting); |
| #endif /* CONFIG_MALI_ARBITER_SUPPORT */ |
| pm_active_err = kbase_pm_context_active_handle_suspend(kctx->kbdev, KBASE_PM_SUSPEND_HANDLER_DONT_REACTIVATE); |
| if (pm_active_err) { |
| struct kbasep_js_device_data *js_devdata = &kctx->kbdev->js_data; |
| |
| /* We're suspended - queue this on the list of suspended jobs |
| * Use dep_item[1], because dep_item[0] was previously in use |
| * for 'waiting_soft_jobs'. |
| */ |
| mutex_lock(&js_devdata->runpool_mutex); |
| list_add_tail(&katom->dep_item[1], &js_devdata->suspended_soft_jobs_list); |
| mutex_unlock(&js_devdata->runpool_mutex); |
| |
| /* Also adding this to the list of waiting soft job */ |
| kbasep_add_waiting_soft_job(katom); |
| |
| return pm_active_err; |
| } |
| #ifdef CONFIG_MALI_ARBITER_SUPPORT |
| else |
| atomic_dec(&kctx->kbdev->pm.gpu_users_waiting); |
| #endif /* CONFIG_MALI_ARBITER_SUPPORT */ |
| |
| kbase_backend_get_gpu_time(kctx->kbdev, &cycle_counter, &system_time, |
| &ts); |
| |
| kbase_pm_context_idle(kctx->kbdev); |
| |
| data.sec = ts.tv_sec; |
| data.usec = ts.tv_nsec / 1000; |
| data.system_time = system_time; |
| data.cycle_counter = cycle_counter; |
| |
| /* Assume this atom will be cancelled until we know otherwise */ |
| katom->event_code = BASE_JD_EVENT_JOB_CANCELLED; |
| |
| /* GPU_WR access is checked on the range for returning the result to |
| * userspace for the following reasons: |
| * - security, this is currently how imported user bufs are checked. |
| * - userspace ddk guaranteed to assume region was mapped as GPU_WR |
| */ |
| user_result = kbase_vmap_prot(kctx, jc, sizeof(data), KBASE_REG_GPU_WR, &map); |
| if (!user_result) |
| return 0; |
| |
| memcpy(user_result, &data, sizeof(data)); |
| |
| kbase_vunmap(kctx, &map); |
| |
| /* Atom was fine - mark it as done */ |
| katom->event_code = BASE_JD_EVENT_DONE; |
| |
| return 0; |
| } |
| |
| #if defined(CONFIG_SYNC) || defined(CONFIG_SYNC_FILE) |
| /* Called by the explicit fence mechanism when a fence wait has completed */ |
| void kbase_soft_event_wait_callback(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| |
| mutex_lock(&kctx->jctx.lock); |
| kbasep_remove_waiting_soft_job(katom); |
| kbase_finish_soft_job(katom); |
| if (kbase_jd_done_nolock(katom, true)) |
| kbase_js_sched_all(kctx->kbdev); |
| mutex_unlock(&kctx->jctx.lock); |
| } |
| #endif |
| |
| static void kbasep_soft_event_complete_job(struct work_struct *work) |
| { |
| struct kbase_jd_atom *katom = container_of(work, struct kbase_jd_atom, |
| work); |
| struct kbase_context *kctx = katom->kctx; |
| int resched; |
| |
| mutex_lock(&kctx->jctx.lock); |
| resched = kbase_jd_done_nolock(katom, true); |
| mutex_unlock(&kctx->jctx.lock); |
| |
| if (resched) |
| kbase_js_sched_all(kctx->kbdev); |
| } |
| |
| void kbasep_complete_triggered_soft_events(struct kbase_context *kctx, u64 evt) |
| { |
| int cancel_timer = 1; |
| struct list_head *entry, *tmp; |
| unsigned long lflags; |
| |
| spin_lock_irqsave(&kctx->waiting_soft_jobs_lock, lflags); |
| list_for_each_safe(entry, tmp, &kctx->waiting_soft_jobs) { |
| struct kbase_jd_atom *katom = list_entry( |
| entry, struct kbase_jd_atom, queue); |
| |
| switch (katom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) { |
| case BASE_JD_REQ_SOFT_EVENT_WAIT: |
| if (katom->jc == evt) { |
| list_del(&katom->queue); |
| |
| katom->event_code = BASE_JD_EVENT_DONE; |
| INIT_WORK(&katom->work, |
| kbasep_soft_event_complete_job); |
| queue_work(kctx->jctx.job_done_wq, |
| &katom->work); |
| } else { |
| /* There are still other waiting jobs, we cannot |
| * cancel the timer yet. |
| */ |
| cancel_timer = 0; |
| } |
| break; |
| #ifdef CONFIG_MALI_FENCE_DEBUG |
| case BASE_JD_REQ_SOFT_FENCE_WAIT: |
| /* Keep the timer running if fence debug is enabled and |
| * there are waiting fence jobs. |
| */ |
| cancel_timer = 0; |
| break; |
| #endif |
| } |
| } |
| |
| if (cancel_timer) |
| del_timer(&kctx->soft_job_timeout); |
| spin_unlock_irqrestore(&kctx->waiting_soft_jobs_lock, lflags); |
| } |
| |
| #ifdef CONFIG_MALI_FENCE_DEBUG |
| static void kbase_fence_debug_check_atom(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| struct device *dev = kctx->kbdev->dev; |
| int i; |
| |
| for (i = 0; i < 2; i++) { |
| struct kbase_jd_atom *dep; |
| |
| list_for_each_entry(dep, &katom->dep_head[i], dep_item[i]) { |
| if (dep->status == KBASE_JD_ATOM_STATE_UNUSED || |
| dep->status == KBASE_JD_ATOM_STATE_COMPLETED) |
| continue; |
| |
| if ((dep->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) |
| == BASE_JD_REQ_SOFT_FENCE_TRIGGER) { |
| /* Found blocked trigger fence. */ |
| struct kbase_sync_fence_info info; |
| |
| if (!kbase_sync_fence_in_info_get(dep, &info)) { |
| dev_warn(dev, |
| "\tVictim trigger atom %d fence [%pK] %s: %s\n", |
| kbase_jd_atom_id(kctx, dep), |
| info.fence, |
| info.name, |
| kbase_sync_status_string(info.status)); |
| } |
| } |
| |
| kbase_fence_debug_check_atom(dep); |
| } |
| } |
| } |
| |
| static void kbase_fence_debug_wait_timeout(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| struct device *dev = katom->kctx->kbdev->dev; |
| int timeout_ms = atomic_read(&kctx->kbdev->js_data.soft_job_timeout_ms); |
| unsigned long lflags; |
| struct kbase_sync_fence_info info; |
| |
| spin_lock_irqsave(&kctx->waiting_soft_jobs_lock, lflags); |
| |
| if (kbase_sync_fence_in_info_get(katom, &info)) { |
| /* Fence must have signaled just after timeout. */ |
| spin_unlock_irqrestore(&kctx->waiting_soft_jobs_lock, lflags); |
| return; |
| } |
| |
| dev_warn(dev, "ctx %d_%d: Atom %d still waiting for fence [%pK] after %dms\n", |
| kctx->tgid, kctx->id, |
| kbase_jd_atom_id(kctx, katom), |
| info.fence, timeout_ms); |
| dev_warn(dev, "\tGuilty fence [%pK] %s: %s\n", |
| info.fence, info.name, |
| kbase_sync_status_string(info.status)); |
| |
| /* Search for blocked trigger atoms */ |
| kbase_fence_debug_check_atom(katom); |
| |
| spin_unlock_irqrestore(&kctx->waiting_soft_jobs_lock, lflags); |
| |
| kbase_sync_fence_in_dump(katom); |
| } |
| |
| struct kbase_fence_debug_work { |
| struct kbase_jd_atom *katom; |
| struct work_struct work; |
| }; |
| |
| static void kbase_fence_debug_wait_timeout_worker(struct work_struct *work) |
| { |
| struct kbase_fence_debug_work *w = container_of(work, |
| struct kbase_fence_debug_work, work); |
| struct kbase_jd_atom *katom = w->katom; |
| struct kbase_context *kctx = katom->kctx; |
| |
| mutex_lock(&kctx->jctx.lock); |
| kbase_fence_debug_wait_timeout(katom); |
| mutex_unlock(&kctx->jctx.lock); |
| |
| kfree(w); |
| } |
| |
| static void kbase_fence_debug_timeout(struct kbase_jd_atom *katom) |
| { |
| struct kbase_fence_debug_work *work; |
| struct kbase_context *kctx = katom->kctx; |
| |
| /* Enqueue fence debug worker. Use job_done_wq to get |
| * debug print ordered with job completion. |
| */ |
| work = kzalloc(sizeof(struct kbase_fence_debug_work), GFP_ATOMIC); |
| /* Ignore allocation failure. */ |
| if (work) { |
| work->katom = katom; |
| INIT_WORK(&work->work, kbase_fence_debug_wait_timeout_worker); |
| queue_work(kctx->jctx.job_done_wq, &work->work); |
| } |
| } |
| #endif /* CONFIG_MALI_FENCE_DEBUG */ |
| |
| void kbasep_soft_job_timeout_worker(struct timer_list *timer) |
| { |
| struct kbase_context *kctx = container_of(timer, struct kbase_context, |
| soft_job_timeout); |
| u32 timeout_ms = (u32)atomic_read( |
| &kctx->kbdev->js_data.soft_job_timeout_ms); |
| ktime_t cur_time = ktime_get_raw(); |
| bool restarting = false; |
| unsigned long lflags; |
| struct list_head *entry, *tmp; |
| |
| spin_lock_irqsave(&kctx->waiting_soft_jobs_lock, lflags); |
| list_for_each_safe(entry, tmp, &kctx->waiting_soft_jobs) { |
| struct kbase_jd_atom *katom = list_entry(entry, |
| struct kbase_jd_atom, queue); |
| s64 elapsed_time = ktime_to_ms(ktime_sub(cur_time, |
| katom->start_timestamp)); |
| |
| if (elapsed_time < (s64)timeout_ms) { |
| restarting = true; |
| continue; |
| } |
| |
| switch (katom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) { |
| case BASE_JD_REQ_SOFT_EVENT_WAIT: |
| /* Take it out of the list to ensure that it |
| * will be cancelled in all cases |
| */ |
| list_del(&katom->queue); |
| |
| katom->event_code = BASE_JD_EVENT_JOB_CANCELLED; |
| INIT_WORK(&katom->work, kbasep_soft_event_complete_job); |
| queue_work(kctx->jctx.job_done_wq, &katom->work); |
| break; |
| #ifdef CONFIG_MALI_FENCE_DEBUG |
| case BASE_JD_REQ_SOFT_FENCE_WAIT: |
| kbase_fence_debug_timeout(katom); |
| break; |
| #endif |
| } |
| } |
| |
| if (restarting) |
| mod_timer(timer, jiffies + msecs_to_jiffies(timeout_ms)); |
| spin_unlock_irqrestore(&kctx->waiting_soft_jobs_lock, lflags); |
| } |
| |
| static int kbasep_soft_event_wait(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| unsigned char status; |
| |
| /* The status of this soft-job is stored in jc */ |
| if (kbasep_read_soft_event_status(kctx, katom->jc, &status)) { |
| katom->event_code = BASE_JD_EVENT_JOB_CANCELLED; |
| return 0; |
| } |
| |
| if (status == BASE_JD_SOFT_EVENT_SET) |
| return 0; /* Event already set, nothing to do */ |
| |
| kbasep_add_waiting_with_timeout(katom); |
| |
| return 1; |
| } |
| |
| static void kbasep_soft_event_update_locked(struct kbase_jd_atom *katom, |
| unsigned char new_status) |
| { |
| /* Complete jobs waiting on the same event */ |
| struct kbase_context *kctx = katom->kctx; |
| |
| if (kbasep_write_soft_event_status(kctx, katom->jc, new_status) != 0) { |
| katom->event_code = BASE_JD_EVENT_JOB_CANCELLED; |
| return; |
| } |
| |
| if (new_status == BASE_JD_SOFT_EVENT_SET) |
| kbasep_complete_triggered_soft_events(kctx, katom->jc); |
| } |
| |
| /** |
| * kbase_soft_event_update() - Update soft event state |
| * @kctx: Pointer to context |
| * @event: Event to update |
| * @new_status: New status value of event |
| * |
| * Update the event, and wake up any atoms waiting for the event. |
| * |
| * Return: 0 on success, a negative error code on failure. |
| */ |
| int kbase_soft_event_update(struct kbase_context *kctx, |
| u64 event, |
| unsigned char new_status) |
| { |
| int err = 0; |
| |
| mutex_lock(&kctx->jctx.lock); |
| |
| if (kbasep_write_soft_event_status(kctx, event, new_status)) { |
| err = -ENOENT; |
| goto out; |
| } |
| |
| if (new_status == BASE_JD_SOFT_EVENT_SET) |
| kbasep_complete_triggered_soft_events(kctx, event); |
| |
| out: |
| mutex_unlock(&kctx->jctx.lock); |
| |
| return err; |
| } |
| |
| static void kbasep_soft_event_cancel_job(struct kbase_jd_atom *katom) |
| { |
| katom->event_code = BASE_JD_EVENT_JOB_CANCELLED; |
| if (kbase_jd_done_nolock(katom, true)) |
| kbase_js_sched_all(katom->kctx->kbdev); |
| } |
| |
| static void kbase_debug_copy_finish(struct kbase_jd_atom *katom) |
| { |
| struct kbase_debug_copy_buffer *buffers = katom->softjob_data; |
| unsigned int i; |
| unsigned int nr = katom->nr_extres; |
| |
| if (!buffers) |
| return; |
| |
| kbase_gpu_vm_lock(katom->kctx); |
| for (i = 0; i < nr; i++) { |
| int p; |
| struct kbase_mem_phy_alloc *gpu_alloc = buffers[i].gpu_alloc; |
| |
| if (!buffers[i].pages) |
| break; |
| for (p = 0; p < buffers[i].nr_pages; p++) { |
| struct page *pg = buffers[i].pages[p]; |
| |
| if (pg) |
| put_page(pg); |
| } |
| if (buffers[i].is_vmalloc) |
| vfree(buffers[i].pages); |
| else |
| kfree(buffers[i].pages); |
| if (gpu_alloc) { |
| switch (gpu_alloc->type) { |
| case KBASE_MEM_TYPE_IMPORTED_USER_BUF: |
| { |
| kbase_free_user_buffer(&buffers[i]); |
| break; |
| } |
| default: |
| /* Nothing to be done. */ |
| break; |
| } |
| kbase_mem_phy_alloc_put(gpu_alloc); |
| } |
| } |
| kbase_gpu_vm_unlock(katom->kctx); |
| kfree(buffers); |
| |
| katom->softjob_data = NULL; |
| } |
| |
| static int kbase_debug_copy_prepare(struct kbase_jd_atom *katom) |
| { |
| struct kbase_debug_copy_buffer *buffers; |
| struct base_jd_debug_copy_buffer *user_buffers = NULL; |
| unsigned int i; |
| unsigned int nr = katom->nr_extres; |
| int ret = 0; |
| void __user *user_structs = (void __user *)(uintptr_t)katom->jc; |
| |
| if (!user_structs) |
| return -EINVAL; |
| |
| buffers = kcalloc(nr, sizeof(*buffers), GFP_KERNEL); |
| if (!buffers) { |
| ret = -ENOMEM; |
| goto out_cleanup; |
| } |
| katom->softjob_data = buffers; |
| |
| user_buffers = kmalloc_array(nr, sizeof(*user_buffers), GFP_KERNEL); |
| |
| if (!user_buffers) { |
| ret = -ENOMEM; |
| goto out_cleanup; |
| } |
| |
| ret = copy_from_user(user_buffers, user_structs, |
| sizeof(*user_buffers)*nr); |
| if (ret) { |
| ret = -EFAULT; |
| goto out_cleanup; |
| } |
| |
| for (i = 0; i < nr; i++) { |
| u64 addr = user_buffers[i].address; |
| u64 page_addr = addr & PAGE_MASK; |
| u64 end_page_addr = addr + user_buffers[i].size - 1; |
| u64 last_page_addr = end_page_addr & PAGE_MASK; |
| int nr_pages = (last_page_addr-page_addr)/PAGE_SIZE+1; |
| int pinned_pages; |
| struct kbase_va_region *reg; |
| struct base_external_resource user_extres; |
| |
| if (!addr) |
| continue; |
| |
| if (last_page_addr < page_addr) { |
| ret = -EINVAL; |
| goto out_cleanup; |
| } |
| |
| buffers[i].nr_pages = nr_pages; |
| buffers[i].offset = addr & ~PAGE_MASK; |
| if (buffers[i].offset >= PAGE_SIZE) { |
| ret = -EINVAL; |
| goto out_cleanup; |
| } |
| buffers[i].size = user_buffers[i].size; |
| |
| if (nr_pages > (KBASE_MEM_PHY_ALLOC_LARGE_THRESHOLD / |
| sizeof(struct page *))) { |
| buffers[i].is_vmalloc = true; |
| buffers[i].pages = vzalloc(nr_pages * |
| sizeof(struct page *)); |
| } else { |
| buffers[i].is_vmalloc = false; |
| buffers[i].pages = kcalloc(nr_pages, |
| sizeof(struct page *), GFP_KERNEL); |
| } |
| |
| if (!buffers[i].pages) { |
| ret = -ENOMEM; |
| goto out_cleanup; |
| } |
| |
| pinned_pages = get_user_pages_fast(page_addr, |
| nr_pages, |
| 1, /* Write */ |
| buffers[i].pages); |
| if (pinned_pages < 0) { |
| /* get_user_pages_fast has failed - page array is not |
| * valid. Don't try to release any pages. |
| */ |
| buffers[i].nr_pages = 0; |
| |
| ret = pinned_pages; |
| goto out_cleanup; |
| } |
| if (pinned_pages != nr_pages) { |
| /* Adjust number of pages, so that we only attempt to |
| * release pages in the array that we know are valid. |
| */ |
| buffers[i].nr_pages = pinned_pages; |
| |
| ret = -EINVAL; |
| goto out_cleanup; |
| } |
| |
| user_extres = user_buffers[i].extres; |
| if (user_extres.ext_resource == 0ULL) { |
| ret = -EINVAL; |
| goto out_cleanup; |
| } |
| |
| kbase_gpu_vm_lock(katom->kctx); |
| reg = kbase_region_tracker_find_region_enclosing_address( |
| katom->kctx, user_extres.ext_resource & |
| ~BASE_EXT_RES_ACCESS_EXCLUSIVE); |
| |
| if (kbase_is_region_invalid_or_free(reg) || |
| reg->gpu_alloc == NULL) { |
| ret = -EINVAL; |
| goto out_unlock; |
| } |
| |
| buffers[i].gpu_alloc = kbase_mem_phy_alloc_get(reg->gpu_alloc); |
| buffers[i].nr_extres_pages = reg->nr_pages; |
| |
| if (reg->nr_pages*PAGE_SIZE != buffers[i].size) |
| dev_warn(katom->kctx->kbdev->dev, "Copy buffer is not of same size as the external resource to copy.\n"); |
| |
| switch (reg->gpu_alloc->type) { |
| case KBASE_MEM_TYPE_IMPORTED_USER_BUF: |
| { |
| struct kbase_mem_phy_alloc *alloc = reg->gpu_alloc; |
| unsigned long nr_pages = |
| alloc->imported.user_buf.nr_pages; |
| |
| if (alloc->imported.user_buf.mm != current->mm) { |
| ret = -EINVAL; |
| goto out_unlock; |
| } |
| buffers[i].extres_pages = kcalloc(nr_pages, |
| sizeof(struct page *), GFP_KERNEL); |
| if (!buffers[i].extres_pages) { |
| ret = -ENOMEM; |
| goto out_unlock; |
| } |
| |
| ret = get_user_pages_fast( |
| alloc->imported.user_buf.address, |
| nr_pages, 0, |
| buffers[i].extres_pages); |
| if (ret != nr_pages) { |
| /* Adjust number of pages, so that we only |
| * attempt to release pages in the array that we |
| * know are valid. |
| */ |
| if (ret < 0) |
| buffers[i].nr_extres_pages = 0; |
| else |
| buffers[i].nr_extres_pages = ret; |
| |
| goto out_unlock; |
| } |
| ret = 0; |
| break; |
| } |
| default: |
| /* Nothing to be done. */ |
| break; |
| } |
| kbase_gpu_vm_unlock(katom->kctx); |
| } |
| kfree(user_buffers); |
| |
| return ret; |
| |
| out_unlock: |
| kbase_gpu_vm_unlock(katom->kctx); |
| |
| out_cleanup: |
| /* Frees allocated memory for kbase_debug_copy_job struct, including |
| * members, and sets jc to 0 |
| */ |
| kbase_debug_copy_finish(katom); |
| kfree(user_buffers); |
| |
| return ret; |
| } |
| #endif /* !MALI_USE_CSF */ |
| |
| #if KERNEL_VERSION(5, 6, 0) <= LINUX_VERSION_CODE |
| static void *dma_buf_kmap_page(struct kbase_mem_phy_alloc *gpu_alloc, |
| unsigned long page_num, struct page **page) |
| { |
| struct sg_table *sgt = gpu_alloc->imported.umm.sgt; |
| struct sg_page_iter sg_iter; |
| unsigned long page_index = 0; |
| |
| if (WARN_ON(gpu_alloc->type != KBASE_MEM_TYPE_IMPORTED_UMM)) |
| return NULL; |
| |
| if (!sgt) |
| return NULL; |
| |
| if (WARN_ON(page_num >= gpu_alloc->nents)) |
| return NULL; |
| |
| for_each_sg_page(sgt->sgl, &sg_iter, sgt->nents, 0) { |
| if (page_index == page_num) { |
| *page = sg_page_iter_page(&sg_iter); |
| |
| return kmap(*page); |
| } |
| page_index++; |
| } |
| |
| return NULL; |
| } |
| #endif |
| |
| int kbase_mem_copy_from_extres(struct kbase_context *kctx, |
| struct kbase_debug_copy_buffer *buf_data) |
| { |
| unsigned int i; |
| unsigned int target_page_nr = 0; |
| struct page **pages = buf_data->pages; |
| u64 offset = buf_data->offset; |
| size_t extres_size = buf_data->nr_extres_pages*PAGE_SIZE; |
| size_t to_copy = min(extres_size, buf_data->size); |
| struct kbase_mem_phy_alloc *gpu_alloc = buf_data->gpu_alloc; |
| int ret = 0; |
| size_t dma_to_copy; |
| |
| KBASE_DEBUG_ASSERT(pages != NULL); |
| |
| kbase_gpu_vm_lock(kctx); |
| if (!gpu_alloc) { |
| ret = -EINVAL; |
| goto out_unlock; |
| } |
| |
| switch (gpu_alloc->type) { |
| case KBASE_MEM_TYPE_IMPORTED_USER_BUF: |
| { |
| for (i = 0; i < buf_data->nr_extres_pages && |
| target_page_nr < buf_data->nr_pages; i++) { |
| struct page *pg = buf_data->extres_pages[i]; |
| void *extres_page = kmap(pg); |
| |
| if (extres_page) { |
| ret = kbase_mem_copy_to_pinned_user_pages( |
| pages, extres_page, &to_copy, |
| buf_data->nr_pages, |
| &target_page_nr, offset); |
| kunmap(pg); |
| if (ret) |
| goto out_unlock; |
| } |
| } |
| } |
| break; |
| case KBASE_MEM_TYPE_IMPORTED_UMM: { |
| struct dma_buf *dma_buf = gpu_alloc->imported.umm.dma_buf; |
| |
| KBASE_DEBUG_ASSERT(dma_buf != NULL); |
| if (dma_buf->size > buf_data->nr_extres_pages * PAGE_SIZE) |
| dev_warn(kctx->kbdev->dev, "External resources buffer size mismatch"); |
| |
| dma_to_copy = min(dma_buf->size, |
| (size_t)(buf_data->nr_extres_pages * PAGE_SIZE)); |
| ret = dma_buf_begin_cpu_access(dma_buf, DMA_FROM_DEVICE); |
| if (ret) |
| goto out_unlock; |
| |
| for (i = 0; i < dma_to_copy/PAGE_SIZE && |
| target_page_nr < buf_data->nr_pages; i++) { |
| #if KERNEL_VERSION(5, 6, 0) <= LINUX_VERSION_CODE |
| struct page *pg; |
| void *extres_page = dma_buf_kmap_page(gpu_alloc, i, &pg); |
| #else |
| void *extres_page = dma_buf_kmap(dma_buf, i); |
| #endif |
| if (extres_page) { |
| ret = kbase_mem_copy_to_pinned_user_pages( |
| pages, extres_page, &to_copy, |
| buf_data->nr_pages, |
| &target_page_nr, offset); |
| |
| #if KERNEL_VERSION(5, 6, 0) <= LINUX_VERSION_CODE |
| kunmap(pg); |
| #else |
| dma_buf_kunmap(dma_buf, i, extres_page); |
| #endif |
| if (ret) |
| break; |
| } |
| } |
| dma_buf_end_cpu_access(dma_buf, DMA_FROM_DEVICE); |
| break; |
| } |
| default: |
| ret = -EINVAL; |
| } |
| out_unlock: |
| kbase_gpu_vm_unlock(kctx); |
| return ret; |
| } |
| |
| #if !MALI_USE_CSF |
| static int kbase_debug_copy(struct kbase_jd_atom *katom) |
| { |
| struct kbase_debug_copy_buffer *buffers = katom->softjob_data; |
| unsigned int i; |
| |
| if (WARN_ON(!buffers)) |
| return -EINVAL; |
| |
| for (i = 0; i < katom->nr_extres; i++) { |
| int res = kbase_mem_copy_from_extres(katom->kctx, &buffers[i]); |
| |
| if (res) |
| return res; |
| } |
| |
| return 0; |
| } |
| #endif /* !MALI_USE_CSF */ |
| |
| #define KBASEP_JIT_ALLOC_GPU_ADDR_ALIGNMENT ((u32)0x7) |
| |
| int kbasep_jit_alloc_validate(struct kbase_context *kctx, |
| struct base_jit_alloc_info *info) |
| { |
| int j; |
| /* If the ID is zero, then fail the job */ |
| if (info->id == 0) |
| return -EINVAL; |
| |
| /* Sanity check that the PA fits within the VA */ |
| if (info->va_pages < info->commit_pages) |
| return -EINVAL; |
| |
| /* Ensure the GPU address is correctly aligned */ |
| if ((info->gpu_alloc_addr & KBASEP_JIT_ALLOC_GPU_ADDR_ALIGNMENT) != 0) |
| return -EINVAL; |
| |
| /* Interface version 2 (introduced with kernel driver version 11.5) |
| * onward has padding and a flags member to validate. |
| * |
| * Note: To support earlier versions the extra bytes will have been set |
| * to 0 by the caller. |
| */ |
| |
| /* Check padding is all zeroed */ |
| for (j = 0; j < sizeof(info->padding); j++) { |
| if (info->padding[j] != 0) |
| return -EINVAL; |
| } |
| |
| /* Only valid flags shall be set */ |
| if (info->flags & ~(BASE_JIT_ALLOC_VALID_FLAGS)) |
| return -EINVAL; |
| |
| #if !MALI_JIT_PRESSURE_LIMIT_BASE |
| /* If just-in-time memory allocation pressure limit feature is disabled, |
| * heap_info_gpu_addr must be zeroed-out |
| */ |
| if (info->heap_info_gpu_addr) |
| return -EINVAL; |
| #endif |
| |
| #if !MALI_USE_CSF |
| /* If BASE_JIT_ALLOC_HEAP_INFO_IS_SIZE is set, heap_info_gpu_addr |
| * cannot be 0 |
| */ |
| if ((info->flags & BASE_JIT_ALLOC_HEAP_INFO_IS_SIZE) && |
| !info->heap_info_gpu_addr) |
| return -EINVAL; |
| #endif /* !MALI_USE_CSF */ |
| |
| return 0; |
| } |
| |
| #if !MALI_USE_CSF |
| |
| /* |
| * Sizes of user data to copy for each just-in-time memory interface version |
| * |
| * In interface version 2 onwards this is the same as the struct size, allowing |
| * copying of arrays of structures from userspace. |
| * |
| * In interface version 1 the structure size was variable, and hence arrays of |
| * structures cannot be supported easily, and were not a feature present in |
| * version 1 anyway. |
| */ |
| static const size_t jit_info_copy_size_for_jit_version[] = { |
| /* in jit_version 1, the structure did not have any end padding, hence |
| * it could be a different size on 32 and 64-bit clients. We therefore |
| * do not copy past the last member |
| */ |
| [1] = offsetofend(struct base_jit_alloc_info_10_2, id), |
| [2] = sizeof(struct base_jit_alloc_info_11_5), |
| [3] = sizeof(struct base_jit_alloc_info) |
| }; |
| |
| static int kbase_jit_allocate_prepare(struct kbase_jd_atom *katom) |
| { |
| __user u8 *data = (__user u8 *)(uintptr_t) katom->jc; |
| struct base_jit_alloc_info *info; |
| struct kbase_context *kctx = katom->kctx; |
| struct kbase_device *kbdev = kctx->kbdev; |
| u32 count; |
| int ret; |
| u32 i; |
| size_t jit_info_user_copy_size; |
| |
| WARN_ON(kctx->jit_version >= |
| ARRAY_SIZE(jit_info_copy_size_for_jit_version)); |
| jit_info_user_copy_size = |
| jit_info_copy_size_for_jit_version[kctx->jit_version]; |
| WARN_ON(jit_info_user_copy_size > sizeof(*info)); |
| |
| /* For backwards compatibility, and to prevent reading more than 1 jit |
| * info struct on jit version 1 |
| */ |
| if (katom->nr_extres == 0 || kctx->jit_version == 1) |
| katom->nr_extres = 1; |
| count = katom->nr_extres; |
| |
| /* Sanity checks */ |
| if (!data || count > kctx->jit_max_allocations || |
| count > ARRAY_SIZE(kctx->jit_alloc)) { |
| ret = -EINVAL; |
| goto fail; |
| } |
| |
| /* Copy the information for safe access and future storage */ |
| info = kmalloc_array(count, sizeof(*info), GFP_KERNEL); |
| if (!info) { |
| ret = -ENOMEM; |
| goto fail; |
| } |
| |
| katom->softjob_data = info; |
| |
| for (i = 0; i < count; i++, info++, data += jit_info_user_copy_size) { |
| if (copy_from_user(info, data, jit_info_user_copy_size) != 0) { |
| ret = -EINVAL; |
| goto free_info; |
| } |
| /* Clear any remaining bytes when user struct is smaller than |
| * kernel struct. For jit version 1, this also clears the |
| * padding bytes |
| */ |
| memset(((u8 *)info) + jit_info_user_copy_size, 0, |
| sizeof(*info) - jit_info_user_copy_size); |
| |
| ret = kbasep_jit_alloc_validate(kctx, info); |
| if (ret) |
| goto free_info; |
| KBASE_TLSTREAM_TL_ATTRIB_ATOM_JITALLOCINFO( |
| kbdev, katom, info->va_pages, info->commit_pages, |
| info->extension, info->id, info->bin_id, |
| info->max_allocations, info->flags, info->usage_id); |
| } |
| |
| katom->jit_blocked = false; |
| |
| lockdep_assert_held(&kctx->jctx.lock); |
| list_add_tail(&katom->jit_node, &kctx->jctx.jit_atoms_head); |
| |
| /* |
| * Note: |
| * The provided info->gpu_alloc_addr isn't validated here as |
| * userland can cache allocations which means that even |
| * though the region is valid it doesn't represent the |
| * same thing it used to. |
| * |
| * Complete validation of va_pages, commit_pages and extension |
| * isn't done here as it will be done during the call to |
| * kbase_mem_alloc. |
| */ |
| return 0; |
| |
| free_info: |
| kfree(katom->softjob_data); |
| katom->softjob_data = NULL; |
| fail: |
| return ret; |
| } |
| |
| static u8 *kbase_jit_free_get_ids(struct kbase_jd_atom *katom) |
| { |
| if (WARN_ON((katom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) != |
| BASE_JD_REQ_SOFT_JIT_FREE)) |
| return NULL; |
| |
| return (u8 *) katom->softjob_data; |
| } |
| |
| static void kbase_jit_add_to_pending_alloc_list(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| struct list_head *target_list_head = NULL; |
| struct kbase_jd_atom *entry; |
| |
| list_for_each_entry(entry, &kctx->jctx.jit_pending_alloc, queue) { |
| if (katom->age < entry->age) { |
| target_list_head = &entry->queue; |
| break; |
| } |
| } |
| |
| if (target_list_head == NULL) |
| target_list_head = &kctx->jctx.jit_pending_alloc; |
| |
| list_add_tail(&katom->queue, target_list_head); |
| } |
| |
| static int kbase_jit_allocate_process(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| struct kbase_device *kbdev = kctx->kbdev; |
| struct base_jit_alloc_info *info; |
| struct kbase_va_region *reg; |
| struct kbase_vmap_struct mapping; |
| u64 *ptr, new_addr; |
| u32 count = katom->nr_extres; |
| u32 i; |
| bool ignore_pressure_limit = false; |
| |
| trace_sysgraph(SGR_SUBMIT, kctx->id, |
| kbase_jd_atom_id(kctx, katom)); |
| |
| if (katom->jit_blocked) { |
| list_del(&katom->queue); |
| katom->jit_blocked = false; |
| } |
| |
| info = katom->softjob_data; |
| if (WARN_ON(!info)) { |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| return 0; |
| } |
| |
| for (i = 0; i < count; i++, info++) { |
| /* The JIT ID is still in use so fail the allocation */ |
| if (kctx->jit_alloc[info->id]) { |
| katom->event_code = BASE_JD_EVENT_MEM_GROWTH_FAILED; |
| return 0; |
| } |
| } |
| |
| #if MALI_JIT_PRESSURE_LIMIT_BASE |
| /* |
| * If this is the only JIT_ALLOC atom in-flight or if JIT pressure limit |
| * is disabled at the context scope, then bypass JIT pressure limit |
| * logic in kbase_jit_allocate(). |
| */ |
| if (!kbase_ctx_flag(kctx, KCTX_JPL_ENABLED) |
| || (kctx->jit_current_allocations == 0)) { |
| ignore_pressure_limit = true; |
| } |
| #else |
| ignore_pressure_limit = true; |
| #endif /* MALI_JIT_PRESSURE_LIMIT_BASE */ |
| |
| for (i = 0, info = katom->softjob_data; i < count; i++, info++) { |
| if (kctx->jit_alloc[info->id]) { |
| /* The JIT ID is duplicated in this atom. Roll back |
| * previous allocations and fail. |
| */ |
| u32 j; |
| |
| info = katom->softjob_data; |
| for (j = 0; j < i; j++, info++) { |
| kbase_jit_free(kctx, kctx->jit_alloc[info->id]); |
| kctx->jit_alloc[info->id] = |
| KBASE_RESERVED_REG_JIT_ALLOC; |
| } |
| |
| katom->event_code = BASE_JD_EVENT_MEM_GROWTH_FAILED; |
| return 0; |
| } |
| |
| /* Create a JIT allocation */ |
| reg = kbase_jit_allocate(kctx, info, ignore_pressure_limit); |
| if (!reg) { |
| struct kbase_jd_atom *jit_atom; |
| bool can_block = false; |
| |
| lockdep_assert_held(&kctx->jctx.lock); |
| |
| list_for_each_entry(jit_atom, &kctx->jctx.jit_atoms_head, jit_node) { |
| if (jit_atom == katom) |
| break; |
| |
| if ((jit_atom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) == |
| BASE_JD_REQ_SOFT_JIT_FREE) { |
| u8 *free_ids = kbase_jit_free_get_ids(jit_atom); |
| |
| if (free_ids && *free_ids && |
| kctx->jit_alloc[*free_ids]) { |
| /* A JIT free which is active and |
| * submitted before this atom |
| */ |
| can_block = true; |
| break; |
| } |
| } |
| } |
| |
| if (!can_block) { |
| /* Mark the failed allocation as well as the |
| * other un-attempted allocations in the set, |
| * so we know they are in use even if the |
| * allocation itself failed. |
| */ |
| for (; i < count; i++, info++) { |
| kctx->jit_alloc[info->id] = |
| KBASE_RESERVED_REG_JIT_ALLOC; |
| } |
| |
| katom->event_code = BASE_JD_EVENT_MEM_GROWTH_FAILED; |
| dev_warn_ratelimited(kbdev->dev, "JIT alloc softjob failed: atom id %d\n", |
| kbase_jd_atom_id(kctx, katom)); |
| return 0; |
| } |
| |
| /* There are pending frees for an active allocation |
| * so we should wait to see whether they free the |
| * memory. Add to the list of atoms for which JIT |
| * allocation is pending. |
| */ |
| kbase_jit_add_to_pending_alloc_list(katom); |
| katom->jit_blocked = true; |
| |
| /* Rollback, the whole set will be re-attempted */ |
| while (i-- > 0) { |
| info--; |
| kbase_jit_free(kctx, kctx->jit_alloc[info->id]); |
| kctx->jit_alloc[info->id] = NULL; |
| } |
| |
| return 1; |
| } |
| |
| /* Bind it to the user provided ID. */ |
| kctx->jit_alloc[info->id] = reg; |
| } |
| |
| for (i = 0, info = katom->softjob_data; i < count; i++, info++) { |
| u64 entry_mmu_flags = 0; |
| /* |
| * Write the address of the JIT allocation to the user provided |
| * GPU allocation. |
| */ |
| ptr = kbase_vmap_prot(kctx, info->gpu_alloc_addr, sizeof(*ptr), |
| KBASE_REG_CPU_WR, &mapping); |
| if (!ptr) { |
| /* |
| * Leave the allocations "live" as the JIT free atom |
| * will be submitted anyway. |
| */ |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| return 0; |
| } |
| |
| reg = kctx->jit_alloc[info->id]; |
| new_addr = reg->start_pfn << PAGE_SHIFT; |
| *ptr = new_addr; |
| |
| #if defined(CONFIG_MALI_VECTOR_DUMP) |
| /* |
| * Retrieve the mmu flags for JIT allocation |
| * only if dumping is enabled |
| */ |
| entry_mmu_flags = kbase_mmu_create_ate(kbdev, |
| (struct tagged_addr){ 0 }, reg->flags, |
| MIDGARD_MMU_BOTTOMLEVEL, kctx->jit_group_id); |
| #endif |
| |
| KBASE_TLSTREAM_TL_ATTRIB_ATOM_JIT( |
| kbdev, katom, info->gpu_alloc_addr, new_addr, |
| info->flags, entry_mmu_flags, info->id, |
| info->commit_pages, info->extension, info->va_pages); |
| kbase_vunmap(kctx, &mapping); |
| |
| kbase_trace_jit_report_gpu_mem(kctx, reg, |
| KBASE_JIT_REPORT_ON_ALLOC_OR_FREE); |
| } |
| |
| katom->event_code = BASE_JD_EVENT_DONE; |
| |
| return 0; |
| } |
| |
| static void kbase_jit_allocate_finish(struct kbase_jd_atom *katom) |
| { |
| struct base_jit_alloc_info *info; |
| |
| lockdep_assert_held(&katom->kctx->jctx.lock); |
| |
| if (WARN_ON(!katom->softjob_data)) |
| return; |
| |
| /* Remove atom from jit_atoms_head list */ |
| list_del(&katom->jit_node); |
| |
| if (katom->jit_blocked) { |
| list_del(&katom->queue); |
| katom->jit_blocked = false; |
| } |
| |
| info = katom->softjob_data; |
| /* Free the info structure */ |
| kfree(info); |
| } |
| |
| static int kbase_jit_free_prepare(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| struct kbase_device *kbdev = kctx->kbdev; |
| __user void *data = (__user void *)(uintptr_t) katom->jc; |
| u8 *ids; |
| u32 count = MAX(katom->nr_extres, 1); |
| u32 i; |
| int ret; |
| |
| /* Sanity checks */ |
| if (count > ARRAY_SIZE(kctx->jit_alloc)) { |
| ret = -EINVAL; |
| goto fail; |
| } |
| |
| /* Copy the information for safe access and future storage */ |
| ids = kmalloc_array(count, sizeof(*ids), GFP_KERNEL); |
| if (!ids) { |
| ret = -ENOMEM; |
| goto fail; |
| } |
| |
| lockdep_assert_held(&kctx->jctx.lock); |
| katom->softjob_data = ids; |
| |
| /* For backwards compatibility */ |
| if (katom->nr_extres) { |
| /* Fail the job if there is no list of ids */ |
| if (!data) { |
| ret = -EINVAL; |
| goto free_info; |
| } |
| |
| if (copy_from_user(ids, data, sizeof(*ids)*count) != 0) { |
| ret = -EINVAL; |
| goto free_info; |
| } |
| } else { |
| katom->nr_extres = 1; |
| *ids = (u8)katom->jc; |
| } |
| for (i = 0; i < count; i++) |
| KBASE_TLSTREAM_TL_ATTRIB_ATOM_JITFREEINFO(kbdev, katom, ids[i]); |
| |
| list_add_tail(&katom->jit_node, &kctx->jctx.jit_atoms_head); |
| |
| return 0; |
| |
| free_info: |
| kfree(katom->softjob_data); |
| katom->softjob_data = NULL; |
| fail: |
| return ret; |
| } |
| |
| static void kbase_jit_free_process(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| u8 *ids = kbase_jit_free_get_ids(katom); |
| u32 count = katom->nr_extres; |
| u32 i; |
| |
| if (ids == NULL) { |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| return; |
| } |
| |
| for (i = 0; i < count; i++, ids++) { |
| /* |
| * If the ID is zero or it is not in use yet then fail the job. |
| */ |
| if ((*ids == 0) || (kctx->jit_alloc[*ids] == NULL)) { |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| return; |
| } |
| } |
| } |
| |
| static void kbasep_jit_finish_worker(struct work_struct *work) |
| { |
| struct kbase_jd_atom *katom = container_of(work, struct kbase_jd_atom, |
| work); |
| struct kbase_context *kctx = katom->kctx; |
| int resched; |
| |
| mutex_lock(&kctx->jctx.lock); |
| kbase_finish_soft_job(katom); |
| resched = kbase_jd_done_nolock(katom, true); |
| mutex_unlock(&kctx->jctx.lock); |
| |
| if (resched) |
| kbase_js_sched_all(kctx->kbdev); |
| } |
| |
| void kbase_jit_retry_pending_alloc(struct kbase_context *kctx) |
| { |
| LIST_HEAD(jit_pending_alloc_list); |
| struct list_head *i, *tmp; |
| |
| list_splice_tail_init(&kctx->jctx.jit_pending_alloc, |
| &jit_pending_alloc_list); |
| |
| list_for_each_safe(i, tmp, &jit_pending_alloc_list) { |
| struct kbase_jd_atom *pending_atom = list_entry(i, |
| struct kbase_jd_atom, queue); |
| KBASE_TLSTREAM_TL_EVENT_ATOM_SOFTJOB_START(kctx->kbdev, pending_atom); |
| kbase_kinstr_jm_atom_sw_start(pending_atom); |
| if (kbase_jit_allocate_process(pending_atom) == 0) { |
| /* Atom has completed */ |
| INIT_WORK(&pending_atom->work, |
| kbasep_jit_finish_worker); |
| queue_work(kctx->jctx.job_done_wq, &pending_atom->work); |
| } |
| KBASE_TLSTREAM_TL_EVENT_ATOM_SOFTJOB_END(kctx->kbdev, pending_atom); |
| kbase_kinstr_jm_atom_sw_stop(pending_atom); |
| } |
| } |
| |
| static void kbase_jit_free_finish(struct kbase_jd_atom *katom) |
| { |
| struct kbase_context *kctx = katom->kctx; |
| u8 *ids; |
| size_t j; |
| |
| lockdep_assert_held(&kctx->jctx.lock); |
| |
| ids = kbase_jit_free_get_ids(katom); |
| if (WARN_ON(ids == NULL)) |
| return; |
| |
| /* Remove this atom from the jit_atoms_head list */ |
| list_del(&katom->jit_node); |
| |
| for (j = 0; j != katom->nr_extres; ++j) { |
| if ((ids[j] != 0) && (kctx->jit_alloc[ids[j]] != NULL)) { |
| /* |
| * If the ID is valid but the allocation request failed |
| * still succeed this soft job but don't try and free |
| * the allocation. |
| */ |
| if (kctx->jit_alloc[ids[j]] != |
| KBASE_RESERVED_REG_JIT_ALLOC) { |
| KBASE_TLSTREAM_TL_JIT_USEDPAGES(kctx->kbdev, |
| kctx->jit_alloc[ids[j]]-> |
| gpu_alloc->nents, ids[j]); |
| kbase_jit_free(kctx, kctx->jit_alloc[ids[j]]); |
| } |
| kctx->jit_alloc[ids[j]] = NULL; |
| } |
| } |
| /* Free the list of ids */ |
| kfree(ids); |
| |
| kbase_jit_retry_pending_alloc(kctx); |
| } |
| |
| static int kbase_ext_res_prepare(struct kbase_jd_atom *katom) |
| { |
| __user struct base_external_resource_list *user_ext_res; |
| struct base_external_resource_list *ext_res; |
| u64 count = 0; |
| size_t copy_size; |
| |
| user_ext_res = (__user struct base_external_resource_list *) |
| (uintptr_t) katom->jc; |
| |
| /* Fail the job if there is no info structure */ |
| if (!user_ext_res) |
| return -EINVAL; |
| |
| if (copy_from_user(&count, &user_ext_res->count, sizeof(u64)) != 0) |
| return -EINVAL; |
| |
| /* Is the number of external resources in range? */ |
| if (!count || count > BASE_EXT_RES_COUNT_MAX) |
| return -EINVAL; |
| |
| /* Copy the information for safe access and future storage */ |
| copy_size = sizeof(*ext_res); |
| copy_size += sizeof(struct base_external_resource) * (count - 1); |
| ext_res = memdup_user(user_ext_res, copy_size); |
| if (IS_ERR(ext_res)) |
| return PTR_ERR(ext_res); |
| |
| /* |
| * Overwrite the count with the first value incase it was changed |
| * after the fact. |
| */ |
| ext_res->count = count; |
| |
| katom->softjob_data = ext_res; |
| |
| return 0; |
| } |
| |
| static void kbase_ext_res_process(struct kbase_jd_atom *katom, bool map) |
| { |
| struct base_external_resource_list *ext_res; |
| int i; |
| bool failed = false; |
| |
| ext_res = katom->softjob_data; |
| if (!ext_res) |
| goto failed_jc; |
| |
| kbase_gpu_vm_lock(katom->kctx); |
| |
| for (i = 0; i < ext_res->count; i++) { |
| u64 gpu_addr; |
| |
| gpu_addr = ext_res->ext_res[i].ext_resource & |
| ~BASE_EXT_RES_ACCESS_EXCLUSIVE; |
| if (map) { |
| if (!kbase_sticky_resource_acquire(katom->kctx, |
| gpu_addr)) |
| goto failed_loop; |
| } else { |
| if (!kbase_sticky_resource_release_force(katom->kctx, NULL, |
| gpu_addr)) |
| failed = true; |
| } |
| } |
| |
| /* |
| * In the case of unmap we continue unmapping other resources in the |
| * case of failure but will always report failure if _any_ unmap |
| * request fails. |
| */ |
| if (failed) |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| else |
| katom->event_code = BASE_JD_EVENT_DONE; |
| |
| kbase_gpu_vm_unlock(katom->kctx); |
| |
| return; |
| |
| failed_loop: |
| while (i > 0) { |
| u64 const gpu_addr = ext_res->ext_res[i - 1].ext_resource & |
| ~BASE_EXT_RES_ACCESS_EXCLUSIVE; |
| |
| kbase_sticky_resource_release_force(katom->kctx, NULL, gpu_addr); |
| |
| --i; |
| } |
| |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| kbase_gpu_vm_unlock(katom->kctx); |
| |
| failed_jc: |
| return; |
| } |
| |
| static void kbase_ext_res_finish(struct kbase_jd_atom *katom) |
| { |
| struct base_external_resource_list *ext_res; |
| |
| ext_res = katom->softjob_data; |
| /* Free the info structure */ |
| kfree(ext_res); |
| } |
| |
| int kbase_process_soft_job(struct kbase_jd_atom *katom) |
| { |
| int ret = 0; |
| struct kbase_context *kctx = katom->kctx; |
| struct kbase_device *kbdev = kctx->kbdev; |
| |
| KBASE_TLSTREAM_TL_EVENT_ATOM_SOFTJOB_START(kbdev, katom); |
| kbase_kinstr_jm_atom_sw_start(katom); |
| |
| trace_sysgraph(SGR_SUBMIT, kctx->id, |
| kbase_jd_atom_id(kctx, katom)); |
| |
| switch (katom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) { |
| case BASE_JD_REQ_SOFT_DUMP_CPU_GPU_TIME: |
| ret = kbase_dump_cpu_gpu_time(katom); |
| break; |
| |
| #if defined(CONFIG_SYNC) || defined(CONFIG_SYNC_FILE) |
| case BASE_JD_REQ_SOFT_FENCE_TRIGGER: |
| katom->event_code = kbase_sync_fence_out_trigger(katom, |
| katom->event_code == BASE_JD_EVENT_DONE ? |
| 0 : -EFAULT); |
| break; |
| case BASE_JD_REQ_SOFT_FENCE_WAIT: |
| { |
| ret = kbase_sync_fence_in_wait(katom); |
| |
| if (ret == 1) { |
| #ifdef CONFIG_MALI_FENCE_DEBUG |
| kbasep_add_waiting_with_timeout(katom); |
| #else |
| kbasep_add_waiting_soft_job(katom); |
| #endif |
| } |
| break; |
| } |
| #endif |
| case BASE_JD_REQ_SOFT_EVENT_WAIT: |
| ret = kbasep_soft_event_wait(katom); |
| break; |
| case BASE_JD_REQ_SOFT_EVENT_SET: |
| kbasep_soft_event_update_locked(katom, BASE_JD_SOFT_EVENT_SET); |
| break; |
| case BASE_JD_REQ_SOFT_EVENT_RESET: |
| kbasep_soft_event_update_locked(katom, BASE_JD_SOFT_EVENT_RESET); |
| break; |
| case BASE_JD_REQ_SOFT_DEBUG_COPY: |
| { |
| int res = kbase_debug_copy(katom); |
| |
| if (res) |
| katom->event_code = BASE_JD_EVENT_JOB_INVALID; |
| break; |
| } |
| case BASE_JD_REQ_SOFT_JIT_ALLOC: |
| ret = kbase_jit_allocate_process(katom); |
| break; |
| case BASE_JD_REQ_SOFT_JIT_FREE: |
| kbase_jit_free_process(katom); |
| break; |
| case BASE_JD_REQ_SOFT_EXT_RES_MAP: |
| kbase_ext_res_process(katom, true); |
| break; |
| case BASE_JD_REQ_SOFT_EXT_RES_UNMAP: |
| kbase_ext_res_process(katom, false); |
| break; |
| } |
| |
| /* Atom is complete */ |
| KBASE_TLSTREAM_TL_EVENT_ATOM_SOFTJOB_END(kbdev, katom); |
| kbase_kinstr_jm_atom_sw_stop(katom); |
| return ret; |
| } |
| |
| void kbase_cancel_soft_job(struct kbase_jd_atom *katom) |
| { |
| switch (katom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) { |
| #if defined(CONFIG_SYNC) || defined(CONFIG_SYNC_FILE) |
| case BASE_JD_REQ_SOFT_FENCE_WAIT: |
| kbase_sync_fence_in_cancel_wait(katom); |
| break; |
| #endif |
| case BASE_JD_REQ_SOFT_EVENT_WAIT: |
| kbasep_soft_event_cancel_job(katom); |
| break; |
| default: |
| /* This soft-job doesn't support cancellation! */ |
| KBASE_DEBUG_ASSERT(0); |
| } |
| } |
| |
| int kbase_prepare_soft_job(struct kbase_jd_atom *katom) |
| { |
| switch (katom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) { |
| case BASE_JD_REQ_SOFT_DUMP_CPU_GPU_TIME: |
| { |
| if (!IS_ALIGNED(katom->jc, cache_line_size())) |
| return -EINVAL; |
| } |
| break; |
| #if defined(CONFIG_SYNC) || defined(CONFIG_SYNC_FILE) |
| case BASE_JD_REQ_SOFT_FENCE_TRIGGER: |
| { |
| struct base_fence fence; |
| int fd; |
| |
| if (copy_from_user(&fence, |
| (__user void *)(uintptr_t)katom->jc, |
| sizeof(fence)) != 0) |
| return -EINVAL; |
| |
| fd = kbase_sync_fence_out_create(katom, |
| fence.basep.stream_fd); |
| if (fd < 0) |
| return -EINVAL; |
| |
| fence.basep.fd = fd; |
| if (copy_to_user((__user void *)(uintptr_t)katom->jc, |
| &fence, sizeof(fence)) != 0) { |
| kbase_sync_fence_out_remove(katom); |
| /* fd should have been closed here, but there's |
| * no good way of doing that. Since |
| * copy_to_user() very rarely fails, and the fd |
| * will get closed on process termination this |
| * won't be a problem. |
| */ |
| fence.basep.fd = -EINVAL; |
| return -EINVAL; |
| } |
| } |
| break; |
| case BASE_JD_REQ_SOFT_FENCE_WAIT: |
| { |
| struct base_fence fence; |
| int ret; |
| |
| if (copy_from_user(&fence, |
| (__user void *)(uintptr_t)katom->jc, |
| sizeof(fence)) != 0) |
| return -EINVAL; |
| |
| /* Get a reference to the fence object */ |
| ret = kbase_sync_fence_in_from_fd(katom, |
| fence.basep.fd); |
| if (ret < 0) |
| return ret; |
| |
| #ifdef CONFIG_MALI_DMA_FENCE |
| /* |
| * Set KCTX_NO_IMPLICIT_FENCE in the context the first |
| * time a soft fence wait job is observed. This will |
| * prevent the implicit dma-buf fence to conflict with |
| * the Android native sync fences. |
| */ |
| if (!kbase_ctx_flag(katom->kctx, KCTX_NO_IMPLICIT_SYNC)) |
| kbase_ctx_flag_set(katom->kctx, KCTX_NO_IMPLICIT_SYNC); |
| #endif /* CONFIG_MALI_DMA_FENCE */ |
| } |
| break; |
| #endif /* CONFIG_SYNC || CONFIG_SYNC_FILE */ |
| case BASE_JD_REQ_SOFT_JIT_ALLOC: |
| return kbase_jit_allocate_prepare(katom); |
| case BASE_JD_REQ_SOFT_JIT_FREE: |
| return kbase_jit_free_prepare(katom); |
| case BASE_JD_REQ_SOFT_EVENT_WAIT: |
| case BASE_JD_REQ_SOFT_EVENT_SET: |
| case BASE_JD_REQ_SOFT_EVENT_RESET: |
| if (katom->jc == 0) |
| return -EINVAL; |
| break; |
| case BASE_JD_REQ_SOFT_DEBUG_COPY: |
| return kbase_debug_copy_prepare(katom); |
| case BASE_JD_REQ_SOFT_EXT_RES_MAP: |
| return kbase_ext_res_prepare(katom); |
| case BASE_JD_REQ_SOFT_EXT_RES_UNMAP: |
| return kbase_ext_res_prepare(katom); |
| default: |
| /* Unsupported soft-job */ |
| return -EINVAL; |
| } |
| return 0; |
| } |
| |
| void kbase_finish_soft_job(struct kbase_jd_atom *katom) |
| { |
| trace_sysgraph(SGR_COMPLETE, katom->kctx->id, |
| kbase_jd_atom_id(katom->kctx, katom)); |
| |
| switch (katom->core_req & BASE_JD_REQ_SOFT_JOB_TYPE) { |
| case BASE_JD_REQ_SOFT_DUMP_CPU_GPU_TIME: |
| /* Nothing to do */ |
| break; |
| #if defined(CONFIG_SYNC) || defined(CONFIG_SYNC_FILE) |
| case BASE_JD_REQ_SOFT_FENCE_TRIGGER: |
| /* If fence has not yet been signaled, do it now */ |
| kbase_sync_fence_out_trigger(katom, katom->event_code == |
| BASE_JD_EVENT_DONE ? 0 : -EFAULT); |
| break; |
| case BASE_JD_REQ_SOFT_FENCE_WAIT: |
| /* Release katom's reference to fence object */ |
| kbase_sync_fence_in_remove(katom); |
| break; |
| #endif /* CONFIG_SYNC || CONFIG_SYNC_FILE */ |
| case BASE_JD_REQ_SOFT_DEBUG_COPY: |
| kbase_debug_copy_finish(katom); |
| break; |
| case BASE_JD_REQ_SOFT_JIT_ALLOC: |
| kbase_jit_allocate_finish(katom); |
| break; |
| case BASE_JD_REQ_SOFT_EXT_RES_MAP: |
| kbase_ext_res_finish(katom); |
| break; |
| case BASE_JD_REQ_SOFT_EXT_RES_UNMAP: |
| kbase_ext_res_finish(katom); |
| break; |
| case BASE_JD_REQ_SOFT_JIT_FREE: |
| kbase_jit_free_finish(katom); |
| break; |
| } |
| } |
| |
| void kbase_resume_suspended_soft_jobs(struct kbase_device *kbdev) |
| { |
| LIST_HEAD(local_suspended_soft_jobs); |
| struct kbase_jd_atom *tmp_iter; |
| struct kbase_jd_atom *katom_iter; |
| struct kbasep_js_device_data *js_devdata; |
| bool resched = false; |
| |
| KBASE_DEBUG_ASSERT(kbdev); |
| |
| js_devdata = &kbdev->js_data; |
| |
| /* Move out the entire list */ |
| mutex_lock(&js_devdata->runpool_mutex); |
| list_splice_init(&js_devdata->suspended_soft_jobs_list, |
| &local_suspended_soft_jobs); |
| mutex_unlock(&js_devdata->runpool_mutex); |
| |
| /* |
| * Each atom must be detached from the list and ran separately - |
| * it could be re-added to the old list, but this is unlikely |
| */ |
| list_for_each_entry_safe(katom_iter, tmp_iter, |
| &local_suspended_soft_jobs, dep_item[1]) { |
| struct kbase_context *kctx = katom_iter->kctx; |
| |
| mutex_lock(&kctx->jctx.lock); |
| |
| /* Remove from the global list */ |
| list_del(&katom_iter->dep_item[1]); |
| /* Remove from the context's list of waiting soft jobs */ |
| kbasep_remove_waiting_soft_job(katom_iter); |
| |
| if (kbase_process_soft_job(katom_iter) == 0) { |
| kbase_finish_soft_job(katom_iter); |
| resched |= kbase_jd_done_nolock(katom_iter, true); |
| #ifdef CONFIG_MALI_ARBITER_SUPPORT |
| atomic_dec(&kbdev->pm.gpu_users_waiting); |
| #endif /* CONFIG_MALI_ARBITER_SUPPORT */ |
| } |
| mutex_unlock(&kctx->jctx.lock); |
| } |
| |
| if (resched) |
| kbase_js_sched_all(kbdev); |
| } |
| #endif /* !MALI_USE_CSF */ |