1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0 WITH Linux-syscall-note
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * (C) COPYRIGHT 2011-2022 ARM Limited. All rights reserved.
5*4882a593Smuzhiyun *
6*4882a593Smuzhiyun * This program is free software and is provided to you under the terms of the
7*4882a593Smuzhiyun * GNU General Public License version 2 as published by the Free Software
8*4882a593Smuzhiyun * Foundation, and any use by you of this program is subject to the terms
9*4882a593Smuzhiyun * of such GNU license.
10*4882a593Smuzhiyun *
11*4882a593Smuzhiyun * This program is distributed in the hope that it will be useful,
12*4882a593Smuzhiyun * but WITHOUT ANY WARRANTY; without even the implied warranty of
13*4882a593Smuzhiyun * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14*4882a593Smuzhiyun * GNU General Public License for more details.
15*4882a593Smuzhiyun *
16*4882a593Smuzhiyun * You should have received a copy of the GNU General Public License
17*4882a593Smuzhiyun * along with this program; if not, you can access it online at
18*4882a593Smuzhiyun * http://www.gnu.org/licenses/gpl-2.0.html.
19*4882a593Smuzhiyun *
20*4882a593Smuzhiyun */
21*4882a593Smuzhiyun
22*4882a593Smuzhiyun /*
23*4882a593Smuzhiyun * Base kernel property query APIs
24*4882a593Smuzhiyun */
25*4882a593Smuzhiyun
26*4882a593Smuzhiyun #include <mali_kbase.h>
27*4882a593Smuzhiyun #include <gpu/mali_kbase_gpu_regmap.h>
28*4882a593Smuzhiyun #include <mali_kbase_gpuprops.h>
29*4882a593Smuzhiyun #include <mali_kbase_hwaccess_gpuprops.h>
30*4882a593Smuzhiyun #include <mali_kbase_config_defaults.h>
31*4882a593Smuzhiyun #include <uapi/gpu/arm/bifrost/mali_kbase_ioctl.h>
32*4882a593Smuzhiyun #include <linux/clk.h>
33*4882a593Smuzhiyun #include <backend/gpu/mali_kbase_pm_internal.h>
34*4882a593Smuzhiyun #include <linux/of_platform.h>
35*4882a593Smuzhiyun #include <linux/moduleparam.h>
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun
/*
 * kbase_gpuprops_construct_coherent_groups - Build coherency_info from raw regs
 * @props: The &struct base_gpu_props whose raw_props are already populated
 *
 * Derives props->coherency_info (group count, per-group core masks) from the
 * raw register snapshots in props->raw_props: mem_features selects L1 vs L2
 * coherency, and l2_present/shader_present define the group boundaries.
 */
static void kbase_gpuprops_construct_coherent_groups(
		struct base_gpu_props * const props)
{
	struct mali_base_gpu_coherent_group *current_group;
	u64 group_present;
	u64 group_mask;
	u64 first_set, first_set_prev;
	u32 num_groups = 0;

	KBASE_DEBUG_ASSERT(props != NULL);

	/* The raw MEM_FEATURES value doubles as the coherency descriptor */
	props->coherency_info.coherency = props->raw_props.mem_features;
	props->coherency_info.num_core_groups = hweight64(props->raw_props.l2_present);

	if (props->coherency_info.coherency & GROUPS_L2_COHERENT) {
		/* Group is l2 coherent */
		group_present = props->raw_props.l2_present;
	} else {
		/* Group is l1 coherent */
		group_present = props->raw_props.shader_present;
	}

	/*
	 * The coherent group mask can be computed from the l2 present
	 * register.
	 *
	 * For the coherent group n:
	 * group_mask[n] = (first_set[n] - 1) & ~(first_set[n-1] - 1)
	 * where first_set is group_present with only its nth set-bit kept
	 * (i.e. the position from where a new group starts).
	 *
	 * For instance if the groups are l2 coherent and l2_present=0x0..01111:
	 * The first mask is:
	 * group_mask[1] = (first_set[1] - 1) & ~(first_set[0] - 1)
	 *               = (0x0..010 - 1) & ~(0x0..01 - 1)
	 *               = 0x0..00f
	 * The second mask is:
	 * group_mask[2] = (first_set[2] - 1) & ~(first_set[1] - 1)
	 *               = (0x0..100 - 1) & ~(0x0..010 - 1)
	 *               = 0x0..0f0
	 * And so on until all the bits from group_present have been cleared
	 * (i.e. there is no group left).
	 */

	current_group = props->coherency_info.group;
	/* x & ~(x - 1) isolates the lowest set bit of x */
	first_set = group_present & ~(group_present - 1);

	while (group_present != 0 && num_groups < BASE_MAX_COHERENT_GROUPS) {
		group_present -= first_set; /* Clear the current group bit */
		first_set_prev = first_set;

		first_set = group_present & ~(group_present - 1);
		group_mask = (first_set - 1) & ~(first_set_prev - 1);

		/* Populate the coherent_group structure for each group */
		current_group->core_mask = group_mask & props->raw_props.shader_present;
		current_group->num_cores = hweight64(current_group->core_mask);

		num_groups++;
		current_group++;
	}

	/* Any bits left means more groups than BASE_MAX_COHERENT_GROUPS */
	if (group_present != 0)
		pr_warn("Too many coherent groups (keeping only %d groups).\n", BASE_MAX_COHERENT_GROUPS);

	props->coherency_info.num_groups = num_groups;
}
105*4882a593Smuzhiyun
106*4882a593Smuzhiyun /**
107*4882a593Smuzhiyun * kbase_gpuprops_get_curr_config_props - Get the current allocated resources
108*4882a593Smuzhiyun * @kbdev: The &struct kbase_device structure for the device
109*4882a593Smuzhiyun * @curr_config: The &struct curr_config_props structure to receive the result
110*4882a593Smuzhiyun *
111*4882a593Smuzhiyun * Fill the &struct curr_config_props structure with values from the GPU
112*4882a593Smuzhiyun * configuration registers.
113*4882a593Smuzhiyun *
114*4882a593Smuzhiyun * Return: Zero on success, Linux error code on failure
115*4882a593Smuzhiyun */
kbase_gpuprops_get_curr_config_props(struct kbase_device * kbdev,struct curr_config_props * const curr_config)116*4882a593Smuzhiyun int kbase_gpuprops_get_curr_config_props(struct kbase_device *kbdev,
117*4882a593Smuzhiyun struct curr_config_props * const curr_config)
118*4882a593Smuzhiyun {
119*4882a593Smuzhiyun struct kbase_current_config_regdump curr_config_regdump;
120*4882a593Smuzhiyun int err;
121*4882a593Smuzhiyun
122*4882a593Smuzhiyun if (WARN_ON(!kbdev) || WARN_ON(!curr_config))
123*4882a593Smuzhiyun return -EINVAL;
124*4882a593Smuzhiyun
125*4882a593Smuzhiyun /* If update not needed just return. */
126*4882a593Smuzhiyun if (!curr_config->update_needed)
127*4882a593Smuzhiyun return 0;
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun /* Dump relevant registers */
130*4882a593Smuzhiyun err = kbase_backend_gpuprops_get_curr_config(kbdev,
131*4882a593Smuzhiyun &curr_config_regdump);
132*4882a593Smuzhiyun if (err)
133*4882a593Smuzhiyun return err;
134*4882a593Smuzhiyun
135*4882a593Smuzhiyun curr_config->l2_slices =
136*4882a593Smuzhiyun KBASE_UBFX32(curr_config_regdump.mem_features, 8U, 4) + 1;
137*4882a593Smuzhiyun
138*4882a593Smuzhiyun curr_config->l2_present =
139*4882a593Smuzhiyun ((u64) curr_config_regdump.l2_present_hi << 32) +
140*4882a593Smuzhiyun curr_config_regdump.l2_present_lo;
141*4882a593Smuzhiyun
142*4882a593Smuzhiyun curr_config->shader_present =
143*4882a593Smuzhiyun ((u64) curr_config_regdump.shader_present_hi << 32) +
144*4882a593Smuzhiyun curr_config_regdump.shader_present_lo;
145*4882a593Smuzhiyun
146*4882a593Smuzhiyun curr_config->num_cores = hweight64(curr_config->shader_present);
147*4882a593Smuzhiyun
148*4882a593Smuzhiyun curr_config->update_needed = false;
149*4882a593Smuzhiyun
150*4882a593Smuzhiyun return 0;
151*4882a593Smuzhiyun }
152*4882a593Smuzhiyun
153*4882a593Smuzhiyun /**
154*4882a593Smuzhiyun * kbase_gpuprops_req_curr_config_update - Request Current Config Update
155*4882a593Smuzhiyun * @kbdev: The &struct kbase_device structure for the device
156*4882a593Smuzhiyun *
157*4882a593Smuzhiyun * Requests the current configuration to be updated next time the
158*4882a593Smuzhiyun * kbase_gpuprops_get_curr_config_props() is called.
159*4882a593Smuzhiyun *
160*4882a593Smuzhiyun * Return: Zero on success, Linux error code on failure
161*4882a593Smuzhiyun */
kbase_gpuprops_req_curr_config_update(struct kbase_device * kbdev)162*4882a593Smuzhiyun int kbase_gpuprops_req_curr_config_update(struct kbase_device *kbdev)
163*4882a593Smuzhiyun {
164*4882a593Smuzhiyun if (WARN_ON(!kbdev))
165*4882a593Smuzhiyun return -EINVAL;
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun kbdev->gpu_props.curr_config.update_needed = true;
168*4882a593Smuzhiyun return 0;
169*4882a593Smuzhiyun }
170*4882a593Smuzhiyun
171*4882a593Smuzhiyun /**
172*4882a593Smuzhiyun * kbase_gpuprops_get_props - Get the GPU configuration
173*4882a593Smuzhiyun * @gpu_props: The &struct base_gpu_props structure
174*4882a593Smuzhiyun * @kbdev: The &struct kbase_device structure for the device
175*4882a593Smuzhiyun *
176*4882a593Smuzhiyun * Fill the &struct base_gpu_props structure with values from the GPU
177*4882a593Smuzhiyun * configuration registers. Only the raw properties are filled in this function.
178*4882a593Smuzhiyun *
179*4882a593Smuzhiyun * Return: Zero on success, Linux error code on failure
180*4882a593Smuzhiyun */
kbase_gpuprops_get_props(struct base_gpu_props * const gpu_props,struct kbase_device * kbdev)181*4882a593Smuzhiyun static int kbase_gpuprops_get_props(struct base_gpu_props * const gpu_props,
182*4882a593Smuzhiyun struct kbase_device *kbdev)
183*4882a593Smuzhiyun {
184*4882a593Smuzhiyun struct kbase_gpuprops_regdump regdump;
185*4882a593Smuzhiyun int i;
186*4882a593Smuzhiyun int err;
187*4882a593Smuzhiyun
188*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(kbdev != NULL);
189*4882a593Smuzhiyun KBASE_DEBUG_ASSERT(gpu_props != NULL);
190*4882a593Smuzhiyun
191*4882a593Smuzhiyun /* Dump relevant registers */
192*4882a593Smuzhiyun err = kbase_backend_gpuprops_get(kbdev, ®dump);
193*4882a593Smuzhiyun if (err)
194*4882a593Smuzhiyun return err;
195*4882a593Smuzhiyun
196*4882a593Smuzhiyun gpu_props->raw_props.gpu_id = regdump.gpu_id;
197*4882a593Smuzhiyun gpu_props->raw_props.tiler_features = regdump.tiler_features;
198*4882a593Smuzhiyun gpu_props->raw_props.mem_features = regdump.mem_features;
199*4882a593Smuzhiyun gpu_props->raw_props.mmu_features = regdump.mmu_features;
200*4882a593Smuzhiyun gpu_props->raw_props.l2_features = regdump.l2_features;
201*4882a593Smuzhiyun
202*4882a593Smuzhiyun gpu_props->raw_props.as_present = regdump.as_present;
203*4882a593Smuzhiyun gpu_props->raw_props.js_present = regdump.js_present;
204*4882a593Smuzhiyun gpu_props->raw_props.shader_present =
205*4882a593Smuzhiyun ((u64) regdump.shader_present_hi << 32) +
206*4882a593Smuzhiyun regdump.shader_present_lo;
207*4882a593Smuzhiyun gpu_props->raw_props.tiler_present =
208*4882a593Smuzhiyun ((u64) regdump.tiler_present_hi << 32) +
209*4882a593Smuzhiyun regdump.tiler_present_lo;
210*4882a593Smuzhiyun gpu_props->raw_props.l2_present =
211*4882a593Smuzhiyun ((u64) regdump.l2_present_hi << 32) +
212*4882a593Smuzhiyun regdump.l2_present_lo;
213*4882a593Smuzhiyun gpu_props->raw_props.stack_present =
214*4882a593Smuzhiyun ((u64) regdump.stack_present_hi << 32) +
215*4882a593Smuzhiyun regdump.stack_present_lo;
216*4882a593Smuzhiyun
217*4882a593Smuzhiyun for (i = 0; i < GPU_MAX_JOB_SLOTS; i++)
218*4882a593Smuzhiyun gpu_props->raw_props.js_features[i] = regdump.js_features[i];
219*4882a593Smuzhiyun
220*4882a593Smuzhiyun for (i = 0; i < BASE_GPU_NUM_TEXTURE_FEATURES_REGISTERS; i++)
221*4882a593Smuzhiyun gpu_props->raw_props.texture_features[i] = regdump.texture_features[i];
222*4882a593Smuzhiyun
223*4882a593Smuzhiyun gpu_props->raw_props.thread_max_barrier_size = regdump.thread_max_barrier_size;
224*4882a593Smuzhiyun gpu_props->raw_props.thread_max_threads = regdump.thread_max_threads;
225*4882a593Smuzhiyun gpu_props->raw_props.thread_max_workgroup_size = regdump.thread_max_workgroup_size;
226*4882a593Smuzhiyun gpu_props->raw_props.thread_features = regdump.thread_features;
227*4882a593Smuzhiyun gpu_props->raw_props.thread_tls_alloc = regdump.thread_tls_alloc;
228*4882a593Smuzhiyun
229*4882a593Smuzhiyun gpu_props->raw_props.gpu_features =
230*4882a593Smuzhiyun ((u64) regdump.gpu_features_hi << 32) +
231*4882a593Smuzhiyun regdump.gpu_features_lo;
232*4882a593Smuzhiyun
233*4882a593Smuzhiyun return 0;
234*4882a593Smuzhiyun }
235*4882a593Smuzhiyun
kbase_gpuprops_update_core_props_gpu_id(struct base_gpu_props * const gpu_props)236*4882a593Smuzhiyun void kbase_gpuprops_update_core_props_gpu_id(
237*4882a593Smuzhiyun struct base_gpu_props * const gpu_props)
238*4882a593Smuzhiyun {
239*4882a593Smuzhiyun gpu_props->core_props.version_status =
240*4882a593Smuzhiyun KBASE_UBFX32(gpu_props->raw_props.gpu_id, 0U, 4);
241*4882a593Smuzhiyun gpu_props->core_props.minor_revision =
242*4882a593Smuzhiyun KBASE_UBFX32(gpu_props->raw_props.gpu_id, 4U, 8);
243*4882a593Smuzhiyun gpu_props->core_props.major_revision =
244*4882a593Smuzhiyun KBASE_UBFX32(gpu_props->raw_props.gpu_id, 12U, 4);
245*4882a593Smuzhiyun gpu_props->core_props.product_id =
246*4882a593Smuzhiyun KBASE_UBFX32(gpu_props->raw_props.gpu_id, 16U, 16);
247*4882a593Smuzhiyun }
248*4882a593Smuzhiyun
249*4882a593Smuzhiyun /**
250*4882a593Smuzhiyun * kbase_gpuprops_update_max_config_props - Updates the max config properties in
251*4882a593Smuzhiyun * the base_gpu_props.
252*4882a593Smuzhiyun * @base_props: The &struct base_gpu_props structure
253*4882a593Smuzhiyun * @kbdev: The &struct kbase_device structure for the device
254*4882a593Smuzhiyun *
255*4882a593Smuzhiyun * Updates the &struct base_gpu_props structure with the max config properties.
256*4882a593Smuzhiyun */
kbase_gpuprops_update_max_config_props(struct base_gpu_props * const base_props,struct kbase_device * kbdev)257*4882a593Smuzhiyun static void kbase_gpuprops_update_max_config_props(
258*4882a593Smuzhiyun struct base_gpu_props * const base_props, struct kbase_device *kbdev)
259*4882a593Smuzhiyun {
260*4882a593Smuzhiyun int l2_n = 0;
261*4882a593Smuzhiyun
262*4882a593Smuzhiyun if (WARN_ON(!kbdev) || WARN_ON(!base_props))
263*4882a593Smuzhiyun return;
264*4882a593Smuzhiyun
265*4882a593Smuzhiyun /* return if the max_config is not set during arbif initialization */
266*4882a593Smuzhiyun if (kbdev->gpu_props.max_config.core_mask == 0)
267*4882a593Smuzhiyun return;
268*4882a593Smuzhiyun
269*4882a593Smuzhiyun /*
270*4882a593Smuzhiyun * Set the base_props with the maximum config values to ensure that the
271*4882a593Smuzhiyun * user space will always be based on the maximum resources available.
272*4882a593Smuzhiyun */
273*4882a593Smuzhiyun base_props->l2_props.num_l2_slices =
274*4882a593Smuzhiyun kbdev->gpu_props.max_config.l2_slices;
275*4882a593Smuzhiyun base_props->raw_props.shader_present =
276*4882a593Smuzhiyun kbdev->gpu_props.max_config.core_mask;
277*4882a593Smuzhiyun /*
278*4882a593Smuzhiyun * Update l2_present in the raw data to be consistent with the
279*4882a593Smuzhiyun * max_config.l2_slices number.
280*4882a593Smuzhiyun */
281*4882a593Smuzhiyun base_props->raw_props.l2_present = 0;
282*4882a593Smuzhiyun for (l2_n = 0; l2_n < base_props->l2_props.num_l2_slices; l2_n++) {
283*4882a593Smuzhiyun base_props->raw_props.l2_present <<= 1;
284*4882a593Smuzhiyun base_props->raw_props.l2_present |= 0x1;
285*4882a593Smuzhiyun }
286*4882a593Smuzhiyun /*
287*4882a593Smuzhiyun * Update the coherency_info data using just one core group. For
288*4882a593Smuzhiyun * architectures where the max_config is provided by the arbiter it is
289*4882a593Smuzhiyun * not necessary to split the shader core groups in different coherent
290*4882a593Smuzhiyun * groups.
291*4882a593Smuzhiyun */
292*4882a593Smuzhiyun base_props->coherency_info.coherency =
293*4882a593Smuzhiyun base_props->raw_props.mem_features;
294*4882a593Smuzhiyun base_props->coherency_info.num_core_groups = 1;
295*4882a593Smuzhiyun base_props->coherency_info.num_groups = 1;
296*4882a593Smuzhiyun base_props->coherency_info.group[0].core_mask =
297*4882a593Smuzhiyun kbdev->gpu_props.max_config.core_mask;
298*4882a593Smuzhiyun base_props->coherency_info.group[0].num_cores =
299*4882a593Smuzhiyun hweight32(kbdev->gpu_props.max_config.core_mask);
300*4882a593Smuzhiyun }
301*4882a593Smuzhiyun
/**
 * kbase_gpuprops_calculate_props - Calculate the derived properties
 * @gpu_props: The &struct base_gpu_props structure
 * @kbdev: The &struct kbase_device structure for the device
 *
 * Fill the &struct base_gpu_props structure with values derived from the GPU
 * configuration registers
 */
static void kbase_gpuprops_calculate_props(
	struct base_gpu_props * const gpu_props, struct kbase_device *kbdev)
{
	int i;

	/* Populate the base_gpu_props structure */
	kbase_gpuprops_update_core_props_gpu_id(gpu_props);
	gpu_props->core_props.log2_program_counter_size = KBASE_GPU_PC_SIZE_LOG2;
	/* totalram_pages became a function in kernel 5.0 */
#if KERNEL_VERSION(5, 0, 0) > LINUX_VERSION_CODE
	gpu_props->core_props.gpu_available_memory_size = totalram_pages << PAGE_SHIFT;
#else
	gpu_props->core_props.gpu_available_memory_size =
		totalram_pages() << PAGE_SHIFT;
#endif

	for (i = 0; i < BASE_GPU_NUM_TEXTURE_FEATURES_REGISTERS; i++)
		gpu_props->core_props.texture_features[i] = gpu_props->raw_props.texture_features[i];

	/* L2_FEATURES[7:0] = log2 line size, [23:16] = log2 cache size */
	gpu_props->l2_props.log2_line_size = KBASE_UBFX32(gpu_props->raw_props.l2_features, 0U, 8);
	gpu_props->l2_props.log2_cache_size = KBASE_UBFX32(gpu_props->raw_props.l2_features, 16U, 8);

	/* Field with number of l2 slices is added to MEM_FEATURES register
	 * since t76x. Below code assumes that for older GPU reserved bits will
	 * be read as zero.
	 */
	gpu_props->l2_props.num_l2_slices =
		KBASE_UBFX32(gpu_props->raw_props.mem_features, 8U, 4) + 1;

	/* TILER_FEATURES[5:0] = log2 bin size, [11:8] = max active levels */
	gpu_props->tiler_props.bin_size_bytes = 1 << KBASE_UBFX32(gpu_props->raw_props.tiler_features, 0U, 6);
	gpu_props->tiler_props.max_active_levels = KBASE_UBFX32(gpu_props->raw_props.tiler_features, 8U, 4);

	/* A zero register value means the GPU reports no limit: fall back to
	 * the compile-time defaults for each thread property.
	 */
	if (gpu_props->raw_props.thread_max_threads == 0)
		gpu_props->thread_props.max_threads = THREAD_MT_DEFAULT;
	else
		gpu_props->thread_props.max_threads = gpu_props->raw_props.thread_max_threads;

	if (gpu_props->raw_props.thread_max_workgroup_size == 0)
		gpu_props->thread_props.max_workgroup_size = THREAD_MWS_DEFAULT;
	else
		gpu_props->thread_props.max_workgroup_size = gpu_props->raw_props.thread_max_workgroup_size;

	if (gpu_props->raw_props.thread_max_barrier_size == 0)
		gpu_props->thread_props.max_barrier_size = THREAD_MBS_DEFAULT;
	else
		gpu_props->thread_props.max_barrier_size = gpu_props->raw_props.thread_max_barrier_size;

	/* Zero TLS alloc defaults to one slot per thread */
	if (gpu_props->raw_props.thread_tls_alloc == 0)
		gpu_props->thread_props.tls_alloc =
			gpu_props->thread_props.max_threads;
	else
		gpu_props->thread_props.tls_alloc =
			gpu_props->raw_props.thread_tls_alloc;

	/* THREAD_FEATURES is laid out differently on CSF vs Job Manager GPUs */
#if MALI_USE_CSF
	/* CSF: [21:0] max registers, [23:22] impl tech, [31:24] max task queue */
	gpu_props->thread_props.max_registers =
		KBASE_UBFX32(gpu_props->raw_props.thread_features, 0U, 22);
	gpu_props->thread_props.impl_tech =
		KBASE_UBFX32(gpu_props->raw_props.thread_features, 22U, 2);
	gpu_props->thread_props.max_task_queue =
		KBASE_UBFX32(gpu_props->raw_props.thread_features, 24U, 8);
	gpu_props->thread_props.max_thread_group_split = 0;
#else
	/* JM: [15:0] max registers, [23:16] max task queue,
	 * [29:24] max thread group split, [31:30] impl tech
	 */
	gpu_props->thread_props.max_registers =
		KBASE_UBFX32(gpu_props->raw_props.thread_features, 0U, 16);
	gpu_props->thread_props.max_task_queue =
		KBASE_UBFX32(gpu_props->raw_props.thread_features, 16U, 8);
	gpu_props->thread_props.max_thread_group_split =
		KBASE_UBFX32(gpu_props->raw_props.thread_features, 24U, 6);
	gpu_props->thread_props.impl_tech =
		KBASE_UBFX32(gpu_props->raw_props.thread_features, 30U, 2);
#endif

	/* If values are not specified, then use defaults */
	if (gpu_props->thread_props.max_registers == 0) {
		gpu_props->thread_props.max_registers = THREAD_MR_DEFAULT;
		gpu_props->thread_props.max_task_queue = THREAD_MTQ_DEFAULT;
		gpu_props->thread_props.max_thread_group_split = THREAD_MTGS_DEFAULT;
	}

	/*
	 * If the maximum resources allocated information is available it is
	 * necessary to update the base_gpu_props with the max_config info to
	 * the userspace. This is applicable to systems that receive this
	 * information from the arbiter.
	 */
	if (kbdev->gpu_props.max_config.core_mask)
		/* Update the max config properties in the base_gpu_props */
		kbase_gpuprops_update_max_config_props(gpu_props,
			kbdev);
	else
		/* Initialize the coherent_group structure for each group */
		kbase_gpuprops_construct_coherent_groups(gpu_props);
}
403*4882a593Smuzhiyun
kbase_gpuprops_set_max_config(struct kbase_device * kbdev,const struct max_config_props * max_config)404*4882a593Smuzhiyun void kbase_gpuprops_set_max_config(struct kbase_device *kbdev,
405*4882a593Smuzhiyun const struct max_config_props *max_config)
406*4882a593Smuzhiyun {
407*4882a593Smuzhiyun if (WARN_ON(!kbdev) || WARN_ON(!max_config))
408*4882a593Smuzhiyun return;
409*4882a593Smuzhiyun
410*4882a593Smuzhiyun kbdev->gpu_props.max_config.l2_slices = max_config->l2_slices;
411*4882a593Smuzhiyun kbdev->gpu_props.max_config.core_mask = max_config->core_mask;
412*4882a593Smuzhiyun }
413*4882a593Smuzhiyun
/*
 * kbase_gpuprops_set - Populate the device's GPU properties from hardware
 * @kbdev: The &struct kbase_device structure for the device
 *
 * Reads the raw register values, computes derived properties, fills the
 * kbase-only fields, and finally requests/reads the current configuration.
 */
void kbase_gpuprops_set(struct kbase_device *kbdev)
{
	struct kbase_gpu_props *gpu_props;
	struct gpu_raw_gpu_props *raw;

	if (WARN_ON(!kbdev))
		return;
	gpu_props = &kbdev->gpu_props;
	raw = &gpu_props->props.raw_props;

	/* Initialize the base_gpu_props structure from the hardware.
	 * NOTE(review): the error return of kbase_gpuprops_get_props() is
	 * ignored here; on backend failure raw_props may be left
	 * uninitialized — confirm callers tolerate this.
	 */
	kbase_gpuprops_get_props(&gpu_props->props, kbdev);

	/* Populate the derived properties */
	kbase_gpuprops_calculate_props(&gpu_props->props, kbdev);

	/* Populate kbase-only fields */
	/* L2_FEATURES[15:8] = associativity, [31:24] = external bus width */
	gpu_props->l2_props.associativity = KBASE_UBFX32(raw->l2_features, 8U, 8);
	gpu_props->l2_props.external_bus_width = KBASE_UBFX32(raw->l2_features, 24U, 8);

	gpu_props->mem.core_group = KBASE_UBFX32(raw->mem_features, 0U, 1);

	/* MMU_FEATURES[7:0] = VA bits, [15:8] = PA bits */
	gpu_props->mmu.va_bits = KBASE_UBFX32(raw->mmu_features, 0U, 8);
	gpu_props->mmu.pa_bits = KBASE_UBFX32(raw->mmu_features, 8U, 8);

	/* Counts derived from the present bitmaps */
	gpu_props->num_cores = hweight64(raw->shader_present);
	gpu_props->num_core_groups =
		gpu_props->props.coherency_info.num_core_groups;
	gpu_props->num_address_spaces = hweight32(raw->as_present);
	gpu_props->num_job_slots = hweight32(raw->js_present);

	/*
	 * Current configuration is used on HW interactions so that the maximum
	 * config is just used for user space avoiding interactions with parts
	 * of the hardware that might not be allocated to the kbase instance at
	 * that moment.
	 */
	kbase_gpuprops_req_curr_config_update(kbdev);
	kbase_gpuprops_get_curr_config_props(kbdev, &gpu_props->curr_config);
}
454*4882a593Smuzhiyun
kbase_gpuprops_set_features(struct kbase_device * kbdev)455*4882a593Smuzhiyun int kbase_gpuprops_set_features(struct kbase_device *kbdev)
456*4882a593Smuzhiyun {
457*4882a593Smuzhiyun struct base_gpu_props *gpu_props;
458*4882a593Smuzhiyun struct kbase_gpuprops_regdump regdump;
459*4882a593Smuzhiyun int err;
460*4882a593Smuzhiyun
461*4882a593Smuzhiyun gpu_props = &kbdev->gpu_props.props;
462*4882a593Smuzhiyun
463*4882a593Smuzhiyun /* Dump relevant registers */
464*4882a593Smuzhiyun err = kbase_backend_gpuprops_get_features(kbdev, ®dump);
465*4882a593Smuzhiyun if (err)
466*4882a593Smuzhiyun return err;
467*4882a593Smuzhiyun
468*4882a593Smuzhiyun /*
469*4882a593Smuzhiyun * Copy the raw value from the register, later this will get turned
470*4882a593Smuzhiyun * into the selected coherency mode.
471*4882a593Smuzhiyun * Additionally, add non-coherent mode, as this is always supported.
472*4882a593Smuzhiyun */
473*4882a593Smuzhiyun gpu_props->raw_props.coherency_mode = regdump.coherency_features |
474*4882a593Smuzhiyun COHERENCY_FEATURE_BIT(COHERENCY_NONE);
475*4882a593Smuzhiyun
476*4882a593Smuzhiyun if (!kbase_hw_has_feature(kbdev, BASE_HW_FEATURE_THREAD_GROUP_SPLIT))
477*4882a593Smuzhiyun gpu_props->thread_props.max_thread_group_split = 0;
478*4882a593Smuzhiyun
479*4882a593Smuzhiyun /*
480*4882a593Smuzhiyun * The CORE_FEATURES register has different meanings depending on GPU.
481*4882a593Smuzhiyun * On tGOx, bits[3:0] encode num_exec_engines.
482*4882a593Smuzhiyun * On CSF GPUs, bits[7:0] is an enumeration that needs to be parsed,
483*4882a593Smuzhiyun * instead.
484*4882a593Smuzhiyun * GPUs like tTIx have additional fields like LSC_SIZE that are
485*4882a593Smuzhiyun * otherwise reserved/RAZ on older GPUs.
486*4882a593Smuzhiyun */
487*4882a593Smuzhiyun gpu_props->raw_props.core_features = regdump.core_features;
488*4882a593Smuzhiyun
489*4882a593Smuzhiyun #if !MALI_USE_CSF
490*4882a593Smuzhiyun gpu_props->core_props.num_exec_engines =
491*4882a593Smuzhiyun KBASE_UBFX32(gpu_props->raw_props.core_features, 0, 4);
492*4882a593Smuzhiyun #endif
493*4882a593Smuzhiyun
494*4882a593Smuzhiyun return err;
495*4882a593Smuzhiyun }
496*4882a593Smuzhiyun
/*
 * Module parameters to allow the L2 size and hash configuration to be
 * overridden.
 *
 * These parameters must be set on insmod to take effect, and are not visible
 * in sysfs.
 */
static u8 override_l2_size;
module_param(override_l2_size, byte, 0000);
MODULE_PARM_DESC(override_l2_size, "Override L2 size config for testing");

static u8 override_l2_hash;
module_param(override_l2_hash, byte, 0000);
MODULE_PARM_DESC(override_l2_hash, "Override L2 hash config for testing");

/* Per-slice hash values for GPUs with the ASN_HASH feature; the number of
 * values actually supplied on the command line is recorded in
 * num_override_l2_hash_values.
 */
static u32 l2_hash_values[ASN_HASH_COUNT] = {
	0,
};
static unsigned int num_override_l2_hash_values;
module_param_array(l2_hash_values, uint, &num_override_l2_hash_values, 0000);
MODULE_PARM_DESC(l2_hash_values, "Override L2 hash values config for testing");
518*4882a593Smuzhiyun
/* Definitions for range of supported user defined hash functions for GPUs
 * that support L2_CONFIG and not ASN_HASH features. Supported hash function
 * range from 0b1000-0b1111 inclusive. Selection of any other values will
 * lead to undefined behavior.
 */
#define USER_DEFINED_HASH_LO ((u8)0x08)
#define USER_DEFINED_HASH_HI ((u8)0x0F)

/* Outcome of probing module parameters and device tree for L2 overrides. */
enum l2_config_override_result {
	L2_CONFIG_OVERRIDE_FAIL = -1,	/* conflicting or unsupported override */
	L2_CONFIG_OVERRIDE_NONE,	/* no override requested */
	L2_CONFIG_OVERRIDE_OK,		/* at least one override accepted */
};
532*4882a593Smuzhiyun
/**
 * kbase_read_l2_config_from_dt - Read L2 configuration
 * @kbdev: The kbase device for which to get the L2 configuration.
 *
 * Check for L2 configuration overrides in module parameters and device tree.
 * Override values in module parameters take priority over override values in
 * device tree.
 *
 * Return: L2_CONFIG_OVERRIDE_OK if either size or hash, or both was properly
 *         overridden, L2_CONFIG_OVERRIDE_NONE if no overrides are provided.
 *         L2_CONFIG_OVERRIDE_FAIL otherwise.
 */
static enum l2_config_override_result
kbase_read_l2_config_from_dt(struct kbase_device *const kbdev)
{
	struct device_node *np = kbdev->dev->of_node;

	/* Without a device tree node there is nothing to override from. */
	if (!np)
		return L2_CONFIG_OVERRIDE_NONE;

	/* L2 size: module parameter wins over the "l2-size" DT property. */
	if (override_l2_size)
		kbdev->l2_size_override = override_l2_size;
	else if (of_property_read_u8(np, "l2-size", &kbdev->l2_size_override))
		kbdev->l2_size_override = 0;

	/* Check overriding value is supported, if not will result in
	 * undefined behavior. Again the module parameter takes priority over
	 * the "l2-hash" DT property.
	 */
	if (override_l2_hash >= USER_DEFINED_HASH_LO &&
			override_l2_hash <= USER_DEFINED_HASH_HI)
		kbdev->l2_hash_override = override_l2_hash;
	else if (of_property_read_u8(np, "l2-hash", &kbdev->l2_hash_override))
		kbdev->l2_hash_override = 0;

	/* Hash values array: module parameter array wins over the
	 * "l2-hash-values" DT property.
	 */
	kbdev->l2_hash_values_override = false;
	if (num_override_l2_hash_values) {
		unsigned int i;

		kbdev->l2_hash_values_override = true;
		for (i = 0; i < num_override_l2_hash_values; i++)
			kbdev->l2_hash_values[i] = l2_hash_values[i];
	} else if (!of_property_read_u32_array(np, "l2-hash-values",
				kbdev->l2_hash_values,
				ASN_HASH_COUNT))
		kbdev->l2_hash_values_override = true;

	/* The legacy l2-hash override is invalid on GPUs with ASN_HASH. */
	if (kbase_hw_has_feature(kbdev, BASE_HW_FEATURE_ASN_HASH) &&
			(kbdev->l2_hash_override)) {
		dev_err(kbdev->dev, "l2-hash not supported\n");
		return L2_CONFIG_OVERRIDE_FAIL;
	}

	/* Conversely, hash value arrays require the ASN_HASH feature. */
	if (!kbase_hw_has_feature(kbdev, BASE_HW_FEATURE_ASN_HASH) &&
			(kbdev->l2_hash_values_override)) {
		dev_err(kbdev->dev, "l2-hash-values not supported\n");
		return L2_CONFIG_OVERRIDE_FAIL;
	}

	/* The two hash override mechanisms are mutually exclusive. */
	if (kbdev->l2_hash_override && kbdev->l2_hash_values_override) {
		dev_err(kbdev->dev,
			"both l2-hash & l2-hash-values not supported\n");
		return L2_CONFIG_OVERRIDE_FAIL;
	}

	if (kbdev->l2_size_override || kbdev->l2_hash_override ||
			kbdev->l2_hash_values_override)
		return L2_CONFIG_OVERRIDE_OK;

	return L2_CONFIG_OVERRIDE_NONE;
}
603*4882a593Smuzhiyun
/**
 * kbase_gpuprops_update_l2_features - Apply L2 config overrides and read back
 *                                     the reflected L2_FEATURES register
 * @kbdev: The kbase device.
 *
 * On GPUs with the L2_CONFIG feature, reads any L2 size/hash overrides from
 * module parameters or device tree, power-cycles the L2 cache so the new
 * configuration takes effect (it can only be applied while the L2 is off),
 * then reads back L2_FEATURES/L2_CONFIG and updates gpu_props accordingly.
 *
 * Return: 0 on success, -EIO if the override configuration is invalid, or an
 * error code from the register read-back.
 */
int kbase_gpuprops_update_l2_features(struct kbase_device *kbdev)
{
	int err = 0;

	if (kbase_hw_has_feature(kbdev, BASE_HW_FEATURE_L2_CONFIG)) {
		struct kbase_gpuprops_regdump regdump;
		struct base_gpu_props *gpu_props = &kbdev->gpu_props.props;

		/* Check for L2 cache size & hash overrides */
		switch (kbase_read_l2_config_from_dt(kbdev)) {
		case L2_CONFIG_OVERRIDE_FAIL:
			err = -EIO;
			goto exit;
		case L2_CONFIG_OVERRIDE_NONE:
			/* No overrides provided: keep the current hardware
			 * configuration, nothing to power-cycle.
			 */
			goto exit;
		default:
			break;
		}

		/* pm.active_count is expected to be 1 here, which is set in
		 * kbase_hwaccess_pm_powerup().
		 */
		WARN_ON(kbdev->pm.active_count != 1);
		/* The new settings for L2 cache can only be applied when it is
		 * off, so first do the power down.
		 */
		kbase_pm_context_idle(kbdev);
		/* NOTE(review): return value ignored — presumably a wait
		 * timeout is tolerated here; confirm against the backend PM
		 * contract.
		 */
		kbase_pm_wait_for_desired_state(kbdev);

		/* Need L2 to get powered to reflect to L2_FEATURES */
		kbase_pm_context_active(kbdev);

		/* Wait for the completion of L2 power transition */
		kbase_pm_wait_for_l2_powered(kbdev);

		/* Dump L2_FEATURES register */
		err = kbase_backend_gpuprops_get_l2_features(kbdev, &regdump);
		if (err)
			goto exit;

		dev_info(kbdev->dev, "Reflected L2_FEATURES is 0x%x\n",
			 regdump.l2_features);
		dev_info(kbdev->dev, "Reflected L2_CONFIG is 0x%08x\n",
			 regdump.l2_config);

		if (kbase_hw_has_feature(kbdev, BASE_HW_FEATURE_ASN_HASH)) {
			int idx;
			/* Hardware reports whether the requested ASN hash
			 * override was actually accepted.
			 */
			const bool asn_he = regdump.l2_config &
					    L2_CONFIG_ASN_HASH_ENABLE_MASK;
#if !IS_ENABLED(CONFIG_MALI_BIFROST_NO_MALI)
			if (!asn_he && kbdev->l2_hash_values_override)
				dev_err(kbdev->dev,
					"Failed to use requested ASN_HASH, fallback to default");
#endif
			for (idx = 0; idx < ASN_HASH_COUNT; idx++)
				dev_info(kbdev->dev,
					 "%s ASN_HASH[%d] is [0x%08x]\n",
					 asn_he ? "Overridden" : "Default", idx,
					 regdump.l2_asn_hash[idx]);
		}

		/* Update gpuprops with reflected L2_FEATURES */
		gpu_props->raw_props.l2_features = regdump.l2_features;
		/* Cache size lives in bits [23:16] of L2_FEATURES. */
		gpu_props->l2_props.log2_cache_size =
			KBASE_UBFX32(gpu_props->raw_props.l2_features, 16U, 8);
	}

exit:
	return err;
}
674*4882a593Smuzhiyun
/*
 * Table mapping each user-visible KBASE_GPUPROP_* identifier to the offset
 * and size of the corresponding field inside struct base_gpu_props.
 * Consumed by kbase_gpuprops_populate_user_buffer() to serialise the
 * properties into the flat buffer handed to user space.
 */
static struct {
	u32 type;      /* KBASE_GPUPROP_* identifier */
	size_t offset; /* byte offset within base_gpu_props (SIZE_MAX = none) */
	int size;      /* field size in bytes: 1, 2, 4 or 8 */
} gpu_property_mapping[] = {
#define PROP(name, member) \
	{KBASE_GPUPROP_ ## name, offsetof(struct base_gpu_props, member), \
		sizeof(((struct base_gpu_props *)0)->member)}
	PROP(PRODUCT_ID, core_props.product_id),
	PROP(VERSION_STATUS, core_props.version_status),
	PROP(MINOR_REVISION, core_props.minor_revision),
	PROP(MAJOR_REVISION, core_props.major_revision),
	PROP(GPU_FREQ_KHZ_MAX, core_props.gpu_freq_khz_max),
	PROP(LOG2_PROGRAM_COUNTER_SIZE, core_props.log2_program_counter_size),
	PROP(TEXTURE_FEATURES_0, core_props.texture_features[0]),
	PROP(TEXTURE_FEATURES_1, core_props.texture_features[1]),
	PROP(TEXTURE_FEATURES_2, core_props.texture_features[2]),
	PROP(TEXTURE_FEATURES_3, core_props.texture_features[3]),
	PROP(GPU_AVAILABLE_MEMORY_SIZE, core_props.gpu_available_memory_size),

#if MALI_USE_CSF
/* CSF GPUs no longer carry this field; emit a dummy entry (offset SIZE_MAX)
 * so older user space still finds the property ID in the buffer.
 */
#define BACKWARDS_COMPAT_PROP(name, type) \
	{ \
		KBASE_GPUPROP_##name, SIZE_MAX, sizeof(type) \
	}
	BACKWARDS_COMPAT_PROP(NUM_EXEC_ENGINES, u8),
#else
	PROP(NUM_EXEC_ENGINES, core_props.num_exec_engines),
#endif

	PROP(L2_LOG2_LINE_SIZE, l2_props.log2_line_size),
	PROP(L2_LOG2_CACHE_SIZE, l2_props.log2_cache_size),
	PROP(L2_NUM_L2_SLICES, l2_props.num_l2_slices),

	PROP(TILER_BIN_SIZE_BYTES, tiler_props.bin_size_bytes),
	PROP(TILER_MAX_ACTIVE_LEVELS, tiler_props.max_active_levels),

	PROP(MAX_THREADS, thread_props.max_threads),
	PROP(MAX_WORKGROUP_SIZE, thread_props.max_workgroup_size),
	PROP(MAX_BARRIER_SIZE, thread_props.max_barrier_size),
	PROP(MAX_REGISTERS, thread_props.max_registers),
	PROP(MAX_TASK_QUEUE, thread_props.max_task_queue),
	PROP(MAX_THREAD_GROUP_SPLIT, thread_props.max_thread_group_split),
	PROP(IMPL_TECH, thread_props.impl_tech),
	PROP(TLS_ALLOC, thread_props.tls_alloc),

	PROP(RAW_SHADER_PRESENT, raw_props.shader_present),
	PROP(RAW_TILER_PRESENT, raw_props.tiler_present),
	PROP(RAW_L2_PRESENT, raw_props.l2_present),
	PROP(RAW_STACK_PRESENT, raw_props.stack_present),
	PROP(RAW_L2_FEATURES, raw_props.l2_features),
	PROP(RAW_CORE_FEATURES, raw_props.core_features),
	PROP(RAW_MEM_FEATURES, raw_props.mem_features),
	PROP(RAW_MMU_FEATURES, raw_props.mmu_features),
	PROP(RAW_AS_PRESENT, raw_props.as_present),
	PROP(RAW_JS_PRESENT, raw_props.js_present),
	PROP(RAW_JS_FEATURES_0, raw_props.js_features[0]),
	PROP(RAW_JS_FEATURES_1, raw_props.js_features[1]),
	PROP(RAW_JS_FEATURES_2, raw_props.js_features[2]),
	PROP(RAW_JS_FEATURES_3, raw_props.js_features[3]),
	PROP(RAW_JS_FEATURES_4, raw_props.js_features[4]),
	PROP(RAW_JS_FEATURES_5, raw_props.js_features[5]),
	PROP(RAW_JS_FEATURES_6, raw_props.js_features[6]),
	PROP(RAW_JS_FEATURES_7, raw_props.js_features[7]),
	PROP(RAW_JS_FEATURES_8, raw_props.js_features[8]),
	PROP(RAW_JS_FEATURES_9, raw_props.js_features[9]),
	PROP(RAW_JS_FEATURES_10, raw_props.js_features[10]),
	PROP(RAW_JS_FEATURES_11, raw_props.js_features[11]),
	PROP(RAW_JS_FEATURES_12, raw_props.js_features[12]),
	PROP(RAW_JS_FEATURES_13, raw_props.js_features[13]),
	PROP(RAW_JS_FEATURES_14, raw_props.js_features[14]),
	PROP(RAW_JS_FEATURES_15, raw_props.js_features[15]),
	PROP(RAW_TILER_FEATURES, raw_props.tiler_features),
	PROP(RAW_TEXTURE_FEATURES_0, raw_props.texture_features[0]),
	PROP(RAW_TEXTURE_FEATURES_1, raw_props.texture_features[1]),
	PROP(RAW_TEXTURE_FEATURES_2, raw_props.texture_features[2]),
	PROP(RAW_TEXTURE_FEATURES_3, raw_props.texture_features[3]),
	PROP(RAW_GPU_ID, raw_props.gpu_id),
	PROP(RAW_THREAD_MAX_THREADS, raw_props.thread_max_threads),
	PROP(RAW_THREAD_MAX_WORKGROUP_SIZE, raw_props.thread_max_workgroup_size),
	PROP(RAW_THREAD_MAX_BARRIER_SIZE, raw_props.thread_max_barrier_size),
	PROP(RAW_THREAD_FEATURES, raw_props.thread_features),
	PROP(RAW_COHERENCY_MODE, raw_props.coherency_mode),
	PROP(RAW_THREAD_TLS_ALLOC, raw_props.thread_tls_alloc),
	PROP(RAW_GPU_FEATURES, raw_props.gpu_features),
	PROP(COHERENCY_NUM_GROUPS, coherency_info.num_groups),
	PROP(COHERENCY_NUM_CORE_GROUPS, coherency_info.num_core_groups),
	PROP(COHERENCY_COHERENCY, coherency_info.coherency),
	PROP(COHERENCY_GROUP_0, coherency_info.group[0].core_mask),
	PROP(COHERENCY_GROUP_1, coherency_info.group[1].core_mask),
	PROP(COHERENCY_GROUP_2, coherency_info.group[2].core_mask),
	PROP(COHERENCY_GROUP_3, coherency_info.group[3].core_mask),
	PROP(COHERENCY_GROUP_4, coherency_info.group[4].core_mask),
	PROP(COHERENCY_GROUP_5, coherency_info.group[5].core_mask),
	PROP(COHERENCY_GROUP_6, coherency_info.group[6].core_mask),
	PROP(COHERENCY_GROUP_7, coherency_info.group[7].core_mask),
	PROP(COHERENCY_GROUP_8, coherency_info.group[8].core_mask),
	PROP(COHERENCY_GROUP_9, coherency_info.group[9].core_mask),
	PROP(COHERENCY_GROUP_10, coherency_info.group[10].core_mask),
	PROP(COHERENCY_GROUP_11, coherency_info.group[11].core_mask),
	PROP(COHERENCY_GROUP_12, coherency_info.group[12].core_mask),
	PROP(COHERENCY_GROUP_13, coherency_info.group[13].core_mask),
	PROP(COHERENCY_GROUP_14, coherency_info.group[14].core_mask),
	PROP(COHERENCY_GROUP_15, coherency_info.group[15].core_mask),

#undef PROP
};
782*4882a593Smuzhiyun
kbase_gpuprops_populate_user_buffer(struct kbase_device * kbdev)783*4882a593Smuzhiyun int kbase_gpuprops_populate_user_buffer(struct kbase_device *kbdev)
784*4882a593Smuzhiyun {
785*4882a593Smuzhiyun struct kbase_gpu_props *kprops = &kbdev->gpu_props;
786*4882a593Smuzhiyun struct base_gpu_props *props = &kprops->props;
787*4882a593Smuzhiyun u32 count = ARRAY_SIZE(gpu_property_mapping);
788*4882a593Smuzhiyun u32 i;
789*4882a593Smuzhiyun u32 size = 0;
790*4882a593Smuzhiyun u8 *p;
791*4882a593Smuzhiyun
792*4882a593Smuzhiyun for (i = 0; i < count; i++) {
793*4882a593Smuzhiyun /* 4 bytes for the ID, and the size of the property */
794*4882a593Smuzhiyun size += 4 + gpu_property_mapping[i].size;
795*4882a593Smuzhiyun }
796*4882a593Smuzhiyun
797*4882a593Smuzhiyun kprops->prop_buffer_size = size;
798*4882a593Smuzhiyun kprops->prop_buffer = kzalloc(size, GFP_KERNEL);
799*4882a593Smuzhiyun
800*4882a593Smuzhiyun if (!kprops->prop_buffer) {
801*4882a593Smuzhiyun kprops->prop_buffer_size = 0;
802*4882a593Smuzhiyun return -ENOMEM;
803*4882a593Smuzhiyun }
804*4882a593Smuzhiyun
805*4882a593Smuzhiyun p = kprops->prop_buffer;
806*4882a593Smuzhiyun
807*4882a593Smuzhiyun #define WRITE_U8(v) (*p++ = (v) & 0xFF)
808*4882a593Smuzhiyun #define WRITE_U16(v) do { WRITE_U8(v); WRITE_U8((v) >> 8); } while (0)
809*4882a593Smuzhiyun #define WRITE_U32(v) do { WRITE_U16(v); WRITE_U16((v) >> 16); } while (0)
810*4882a593Smuzhiyun #define WRITE_U64(v) do { WRITE_U32(v); WRITE_U32((v) >> 32); } while (0)
811*4882a593Smuzhiyun
812*4882a593Smuzhiyun for (i = 0; i < count; i++) {
813*4882a593Smuzhiyun u32 type = gpu_property_mapping[i].type;
814*4882a593Smuzhiyun u8 type_size;
815*4882a593Smuzhiyun const size_t offset = gpu_property_mapping[i].offset;
816*4882a593Smuzhiyun const u64 dummy_backwards_compat_value = (u64)0;
817*4882a593Smuzhiyun const void *field;
818*4882a593Smuzhiyun
819*4882a593Smuzhiyun if (likely(offset < sizeof(struct base_gpu_props)))
820*4882a593Smuzhiyun field = ((const u8 *)props) + offset;
821*4882a593Smuzhiyun else
822*4882a593Smuzhiyun field = &dummy_backwards_compat_value;
823*4882a593Smuzhiyun
824*4882a593Smuzhiyun switch (gpu_property_mapping[i].size) {
825*4882a593Smuzhiyun case 1:
826*4882a593Smuzhiyun type_size = KBASE_GPUPROP_VALUE_SIZE_U8;
827*4882a593Smuzhiyun break;
828*4882a593Smuzhiyun case 2:
829*4882a593Smuzhiyun type_size = KBASE_GPUPROP_VALUE_SIZE_U16;
830*4882a593Smuzhiyun break;
831*4882a593Smuzhiyun case 4:
832*4882a593Smuzhiyun type_size = KBASE_GPUPROP_VALUE_SIZE_U32;
833*4882a593Smuzhiyun break;
834*4882a593Smuzhiyun case 8:
835*4882a593Smuzhiyun type_size = KBASE_GPUPROP_VALUE_SIZE_U64;
836*4882a593Smuzhiyun break;
837*4882a593Smuzhiyun default:
838*4882a593Smuzhiyun dev_err(kbdev->dev,
839*4882a593Smuzhiyun "Invalid gpu_property_mapping type=%d size=%d",
840*4882a593Smuzhiyun type, gpu_property_mapping[i].size);
841*4882a593Smuzhiyun return -EINVAL;
842*4882a593Smuzhiyun }
843*4882a593Smuzhiyun
844*4882a593Smuzhiyun WRITE_U32((type<<2) | type_size);
845*4882a593Smuzhiyun
846*4882a593Smuzhiyun switch (type_size) {
847*4882a593Smuzhiyun case KBASE_GPUPROP_VALUE_SIZE_U8:
848*4882a593Smuzhiyun WRITE_U8(*((const u8 *)field));
849*4882a593Smuzhiyun break;
850*4882a593Smuzhiyun case KBASE_GPUPROP_VALUE_SIZE_U16:
851*4882a593Smuzhiyun WRITE_U16(*((const u16 *)field));
852*4882a593Smuzhiyun break;
853*4882a593Smuzhiyun case KBASE_GPUPROP_VALUE_SIZE_U32:
854*4882a593Smuzhiyun WRITE_U32(*((const u32 *)field));
855*4882a593Smuzhiyun break;
856*4882a593Smuzhiyun case KBASE_GPUPROP_VALUE_SIZE_U64:
857*4882a593Smuzhiyun WRITE_U64(*((const u64 *)field));
858*4882a593Smuzhiyun break;
859*4882a593Smuzhiyun default: /* Cannot be reached */
860*4882a593Smuzhiyun WARN_ON(1);
861*4882a593Smuzhiyun return -EINVAL;
862*4882a593Smuzhiyun }
863*4882a593Smuzhiyun }
864*4882a593Smuzhiyun
865*4882a593Smuzhiyun return 0;
866*4882a593Smuzhiyun }
867*4882a593Smuzhiyun
kbase_gpuprops_free_user_buffer(struct kbase_device * kbdev)868*4882a593Smuzhiyun void kbase_gpuprops_free_user_buffer(struct kbase_device *kbdev)
869*4882a593Smuzhiyun {
870*4882a593Smuzhiyun kfree(kbdev->gpu_props.prop_buffer);
871*4882a593Smuzhiyun }
872*4882a593Smuzhiyun
kbase_device_populate_max_freq(struct kbase_device * kbdev)873*4882a593Smuzhiyun int kbase_device_populate_max_freq(struct kbase_device *kbdev)
874*4882a593Smuzhiyun {
875*4882a593Smuzhiyun struct mali_base_gpu_core_props *core_props;
876*4882a593Smuzhiyun
877*4882a593Smuzhiyun /* obtain max configured gpu frequency, if devfreq is enabled then
878*4882a593Smuzhiyun * this will be overridden by the highest operating point found
879*4882a593Smuzhiyun */
880*4882a593Smuzhiyun core_props = &(kbdev->gpu_props.props.core_props);
881*4882a593Smuzhiyun #ifdef GPU_FREQ_KHZ_MAX
882*4882a593Smuzhiyun core_props->gpu_freq_khz_max = GPU_FREQ_KHZ_MAX;
883*4882a593Smuzhiyun #else
884*4882a593Smuzhiyun core_props->gpu_freq_khz_max = DEFAULT_GPU_FREQ_KHZ_MAX;
885*4882a593Smuzhiyun #endif
886*4882a593Smuzhiyun
887*4882a593Smuzhiyun return 0;
888*4882a593Smuzhiyun }
889