// SPDX-License-Identifier: GPL-2.0 WITH Linux-syscall-note
/*
 *
 * (C) COPYRIGHT 2014-2016, 2018-2022 ARM Limited. All rights reserved.
 *
 * This program is free software and is provided to you under the terms of the
 * GNU General Public License version 2 as published by the Free Software
 * Foundation, and any use by you of this program is subject to the terms
 * of such GNU license.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, you can access it online at
 * http://www.gnu.org/licenses/gpl-2.0.html.
 *
 */

#include <mali_kbase.h>
#include <gpu/mali_kbase_gpu_fault.h>
#include <backend/gpu/mali_kbase_instr_internal.h>
#include <backend/gpu/mali_kbase_pm_internal.h>
#include <device/mali_kbase_device.h>
#include <mali_kbase_reset_gpu.h>
#include <mmu/mali_kbase_mmu.h>

#define U64_LO_MASK ((1ULL << 32) - 1)
#define U64_HI_MASK (~U64_LO_MASK)

#if !IS_ENABLED(CONFIG_MALI_NO_MALI)
bool kbase_is_gpu_removed(struct kbase_device *kbdev)
{
	u32 val;

	val = kbase_reg_read(kbdev, GPU_CONTROL_REG(GPU_ID));

	return val == 0;
}
#endif /* !IS_ENABLED(CONFIG_MALI_NO_MALI) */
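
/*
 * Illustrative usage sketch (not part of the driver): kbase_is_gpu_removed()
 * lets callers tell a hung GPU apart from one that has dropped off the bus,
 * since a removed GPU reads back GPU_ID as zero. The error handling shown
 * here is hypothetical:
 *
 *	if (kbase_is_gpu_removed(kbdev)) {
 *		dev_err(kbdev->dev, "GPU removed while waiting\n");
 *		return -EIO;
 *	}
 */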
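/**
 * busy_wait_on_irq - Busy-wait for a bit in GPU_IRQ_RAWSTAT to be set
 * @kbdev:   Kbase device
 * @irq_bit: IRQ raw status bit to poll for
 *
 * Polls GPU_IRQ_RAWSTAT for up to KBASE_AS_INACTIVE_MAX_LOOPS iterations and,
 * once the bit is observed, acknowledges it through GPU_IRQ_CLEAR. If the bit
 * never rises, a GPU reset is triggered.
 *
 * Return: 0 on success, or -EBUSY if the wait timed out.
 */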
static int busy_wait_on_irq(struct kbase_device *kbdev, u32 irq_bit)
{
	char *irq_flag_name;
	/* An MMU-AS command was previously used for the L2 cache flush on
	 * page-table updates, and the same max-loops count is reused for the
	 * GPU command because the L2 cache flush overhead is the same for both.
	 */
	unsigned int max_loops = KBASE_AS_INACTIVE_MAX_LOOPS;

	/* Busy-wait for the GPU flush operation to complete, as signalled by
	 * the given bit in GPU_IRQ_RAWSTAT.
	 */
	while (--max_loops &&
	       !(kbase_reg_read(kbdev, GPU_CONTROL_REG(GPU_IRQ_RAWSTAT)) & irq_bit)) {
		;
	}

	/* Reset the GPU if a timeout occurred */
	if (max_loops == 0) {
		switch (irq_bit) {
		case CLEAN_CACHES_COMPLETED:
			irq_flag_name = "CLEAN_CACHES_COMPLETED";
			break;
		case FLUSH_PA_RANGE_COMPLETED:
			irq_flag_name = "FLUSH_PA_RANGE_COMPLETED";
			break;
		default:
			irq_flag_name = "UNKNOWN";
			break;
		}

		dev_err(kbdev->dev,
			"Stuck waiting on %s bit, which may be caused by a slow/unstable GPU clock or a faulty FPGA connector\n",
			irq_flag_name);

		if (kbase_prepare_to_reset_gpu_locked(kbdev, RESET_FLAGS_NONE))
			kbase_reset_gpu_locked(kbdev);
		return -EBUSY;
	}

	/* Clear the interrupt bit. */
	KBASE_KTRACE_ADD(kbdev, CORE_GPU_IRQ_CLEAR, NULL, irq_bit);
	kbase_reg_write(kbdev, GPU_CONTROL_REG(GPU_IRQ_CLEAR), irq_bit);

	return 0;
}

/* Flushing a physical address range is not supported in this build, so the
 * operation is stubbed out as an unconditional success.
 */
#define kbase_gpu_cache_flush_pa_range_and_busy_wait(kbdev, phys, nr_bytes, flush_op) (0)
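
/*
 * Illustrative sketch only: on builds that do support the PA-range flush, an
 * implementation would split the 64-bit physical address with U64_LO_MASK /
 * U64_HI_MASK into 32-bit command argument registers, issue the flush and
 * then wait on FLUSH_PA_RANGE_COMPLETED. The argument register names below
 * are assumptions for illustration, not a confirmed hardware interface:
 *
 *	kbase_reg_write(kbdev, GPU_COMMAND_ARG0_LO, (u32)(phys & U64_LO_MASK));
 *	kbase_reg_write(kbdev, GPU_COMMAND_ARG0_HI, (u32)((phys & U64_HI_MASK) >> 32));
 *	kbase_reg_write(kbdev, GPU_CONTROL_REG(GPU_COMMAND), flush_op);
 *	ret = busy_wait_on_irq(kbdev, (u32)FLUSH_PA_RANGE_COMPLETED);
 */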

int kbase_gpu_cache_flush_and_busy_wait(struct kbase_device *kbdev,
					u32 flush_op)
{
	int need_to_wake_up = 0;
	int ret = 0;

	/* hwaccess_lock must be held to avoid any sync issue with
	 * kbase_gpu_start_cache_clean() / kbase_clean_caches_done()
	 */
	lockdep_assert_held(&kbdev->hwaccess_lock);

	/* 1. Check if kbdev->cache_clean_in_progress is set.
	 * If it is set, it means there are threads waiting for the
	 * CLEAN_CACHES_COMPLETED irq to be raised and that the
	 * corresponding irq mask bit is set.
	 * We'll clear the irq mask bit and busy-wait for the cache
	 * clean operation to complete before submitting the cache
	 * clean command required after the GPU page table update.
	 * Any pending flush commands are merged into the requested one.
	 */
	if (kbdev->cache_clean_in_progress) {
		/* Disable the CLEAN_CACHES_COMPLETED interrupt first */
		u32 irq_mask = kbase_reg_read(kbdev, GPU_CONTROL_REG(GPU_IRQ_MASK));

		kbase_reg_write(kbdev, GPU_CONTROL_REG(GPU_IRQ_MASK),
				irq_mask & ~CLEAN_CACHES_COMPLETED);

		/* Busy-wait for the in-flight cache clean to complete */
		ret = busy_wait_on_irq(kbdev, (u32)CLEAN_CACHES_COMPLETED);
		if (ret)
			return ret;

		/* Merge the pending flush command, if any, into the requested one */
		flush_op = GPU_COMMAND_FLUSH_CACHE_MERGE(
			kbdev->cache_clean_queued, flush_op);

		/* Remember to wake up the blocked threads once done */
		need_to_wake_up = 1;
	} else {
		/* Clear the interrupt CLEAN_CACHES_COMPLETED bit. */
		kbase_reg_write(kbdev, GPU_CONTROL_REG(GPU_IRQ_CLEAR),
				CLEAN_CACHES_COMPLETED);
	}

	/* 2. Issue the GPU_CONTROL.COMMAND.FLUSH_CACHE operation. */
	KBASE_KTRACE_ADD(kbdev, CORE_GPU_CLEAN_INV_CACHES, NULL, flush_op);
	kbase_reg_write(kbdev, GPU_CONTROL_REG(GPU_COMMAND), flush_op);

	/* 3. Busy-wait for the flush operation to complete. */
	ret = busy_wait_on_irq(kbdev, (u32)CLEAN_CACHES_COMPLETED);
	if (ret)
		return ret;

	/* 4. Wake up any blocked threads. */
	if (need_to_wake_up)
		kbase_gpu_cache_clean_wait_complete(kbdev);

	return ret;
}
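
/*
 * Illustrative caller sketch (hypothetical, not taken from the driver): the
 * function must run with hwaccess_lock held, and flush_op is one of the
 * GPU_COMMAND cache-flush opcodes:
 *
 *	unsigned long flags;
 *	int err;
 *
 *	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
 *	err = kbase_gpu_cache_flush_and_busy_wait(kbdev, flush_op);
 *	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
 */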

void kbase_gpu_start_cache_clean_nolock(struct kbase_device *kbdev,
					u32 flush_op)
{
	u32 irq_mask;

	lockdep_assert_held(&kbdev->hwaccess_lock);

	if (kbdev->cache_clean_in_progress) {
		/* If this is called while another clean is in progress, we
		 * can't rely on the current one to flush any new changes in
		 * the cache. Instead, accumulate all cache clean operations
		 * and trigger them immediately after the current one finishes.
		 */
		kbdev->cache_clean_queued = GPU_COMMAND_FLUSH_CACHE_MERGE(
			kbdev->cache_clean_queued, flush_op);
		return;
	}

	/* Enable the CLEAN_CACHES_COMPLETED interrupt */
	irq_mask = kbase_reg_read(kbdev, GPU_CONTROL_REG(GPU_IRQ_MASK));
	kbase_reg_write(kbdev, GPU_CONTROL_REG(GPU_IRQ_MASK),
			irq_mask | CLEAN_CACHES_COMPLETED);

	KBASE_KTRACE_ADD(kbdev, CORE_GPU_CLEAN_INV_CACHES, NULL, flush_op);
	kbase_reg_write(kbdev, GPU_CONTROL_REG(GPU_COMMAND), flush_op);

	kbdev->cache_clean_in_progress = true;
}
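
/*
 * Note on merging (illustrative, assuming the semantics implied above):
 * GPU_COMMAND_FLUSH_CACHE_MERGE() must produce a flush opcode at least as
 * strong as both of its inputs, so that a single deferred command can stand
 * in for every accumulated request, e.g.
 *
 *	// queued "clean" merged with a requested "clean+invalidate"
 *	// => the merged command performs clean+invalidate
 *	merged = GPU_COMMAND_FLUSH_CACHE_MERGE(queued_op, flush_op);
 */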

void kbase_gpu_start_cache_clean(struct kbase_device *kbdev, u32 flush_op)
{
	unsigned long flags;

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
	kbase_gpu_start_cache_clean_nolock(kbdev, flush_op);
	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
}

void kbase_gpu_cache_clean_wait_complete(struct kbase_device *kbdev)
{
	lockdep_assert_held(&kbdev->hwaccess_lock);

	kbdev->cache_clean_queued = 0;
	kbdev->cache_clean_in_progress = false;
	wake_up(&kbdev->cache_clean_wait);
}

void kbase_clean_caches_done(struct kbase_device *kbdev)
{
	u32 irq_mask;
	unsigned long flags;

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);

	if (kbdev->cache_clean_in_progress) {
		/* Clear the interrupt CLEAN_CACHES_COMPLETED bit if set.
		 * It might have already been done by kbase_gpu_cache_flush_and_busy_wait.
		 */
		KBASE_KTRACE_ADD(kbdev, CORE_GPU_IRQ_CLEAR, NULL, CLEAN_CACHES_COMPLETED);
		kbase_reg_write(kbdev, GPU_CONTROL_REG(GPU_IRQ_CLEAR), CLEAN_CACHES_COMPLETED);

		if (kbdev->cache_clean_queued) {
			u32 pended_flush_op = kbdev->cache_clean_queued;

			kbdev->cache_clean_queued = 0;

			KBASE_KTRACE_ADD(kbdev, CORE_GPU_CLEAN_INV_CACHES, NULL, pended_flush_op);
			kbase_reg_write(kbdev, GPU_CONTROL_REG(GPU_COMMAND), pended_flush_op);
		} else {
			/* Disable the CLEAN_CACHES_COMPLETED interrupt */
			irq_mask = kbase_reg_read(kbdev, GPU_CONTROL_REG(GPU_IRQ_MASK));
			kbase_reg_write(kbdev, GPU_CONTROL_REG(GPU_IRQ_MASK),
					irq_mask & ~CLEAN_CACHES_COMPLETED);

			kbase_gpu_cache_clean_wait_complete(kbdev);
		}
	}

	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);
}

static inline bool get_cache_clean_flag(struct kbase_device *kbdev)
{
	bool cache_clean_in_progress;
	unsigned long flags;

	spin_lock_irqsave(&kbdev->hwaccess_lock, flags);
	cache_clean_in_progress = kbdev->cache_clean_in_progress;
	spin_unlock_irqrestore(&kbdev->hwaccess_lock, flags);

	return cache_clean_in_progress;
}

void kbase_gpu_wait_cache_clean(struct kbase_device *kbdev)
{
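	/* wait_event_interruptible() may return early if the thread catches a
	 * signal, so re-sample the flag under hwaccess_lock and keep waiting
	 * until the cache clean has genuinely finished.
	 */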
	while (get_cache_clean_flag(kbdev)) {
		wait_event_interruptible(kbdev->cache_clean_wait,
					 !kbdev->cache_clean_in_progress);
	}
}

int kbase_gpu_wait_cache_clean_timeout(struct kbase_device *kbdev,
				       unsigned int wait_timeout_ms)
{
	long remaining = msecs_to_jiffies(wait_timeout_ms);

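	/* wait_event_timeout() returns the remaining jiffies (at least 1) when
	 * the condition became true, or 0 on timeout, so the loop ends either
	 * when the clean completes or when the time budget is exhausted.
	 */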
	while (remaining && get_cache_clean_flag(kbdev)) {
		remaining = wait_event_timeout(kbdev->cache_clean_wait,
					       !kbdev->cache_clean_in_progress,
					       remaining);
	}

	return (remaining ? 0 : -ETIMEDOUT);
}