1 // SPDX-License-Identifier: GPL-2.0-only OR MIT
2 /* Copyright (c) 2023 Imagination Technologies Ltd. */
4 #include "pvr_free_list.h"
7 #include "pvr_rogue_cr_defs_client.h"
8 #include "pvr_rogue_fwif.h"
10 #include <drm/drm_gem.h>
11 #include <linux/bitops.h>
12 #include <linux/math.h>
13 #include <linux/slab.h>
14 #include <linux/xarray.h>
15 #include <uapi/drm/pvr_drm.h>
/* Fail the build if the firmware interface array sizes differ from the values asserted here. */
17 static_assert(ROGUE_FWIF_NUM_RTDATAS == 2);
18 static_assert(ROGUE_FWIF_NUM_GEOMDATAS == 1);
19 static_assert(ROGUE_FWIF_NUM_RTDATA_FREELISTS == 2);
22 * struct pvr_rt_mtile_info - Render target macrotile information
24 struct pvr_rt_mtile_info { /* members used in this file: mtile_x[0..2], mtile_y[0..2], tile_size_x/y, num_tiles_x/y, tile_max_x/y */
35 /* Size of Shadow Render Target Cache entry */
/* Multiplied by args->layers to size srtc_obj in hwrt_data_init_fw_structure(). */
36 #define SRTC_ENTRY_SIZE sizeof(u32)
37 /* Size of Renders Accumulation Array entry */
/* Multiplied by args->layers to size raa_obj in hwrt_data_init_fw_structure(). */
38 #define RAA_ENTRY_SIZE sizeof(u32)
/*
 * hwrt_init_kernel_structure() - Fill in the kernel-side fields of a HWRT dataset
 * @pvr_file: File against which the free list handles in @args are looked up.
 * @args: Creation arguments; layers and free_list_handles[] are read here.
 * @hwrt: Dataset to initialise.
 *
 * Records the owning device and the layer count, then resolves every free
 * list handle with pvr_free_list_lookup(). A failed lookup, or a local free
 * list holding fewer pages than pvr_get_free_list_min_pages() reports, jumps
 * to err_put_free_lists, where every free_lists[] slot is put and reset to
 * NULL.
 */
41 hwrt_init_kernel_structure(struct pvr_file *pvr_file,
42 struct drm_pvr_ioctl_create_hwrt_dataset_args *args,
43 struct pvr_hwrt_dataset *hwrt)
45 struct pvr_device *pvr_dev = pvr_file->pvr_dev;
49 hwrt->pvr_dev = pvr_dev;
/* max_rts is consulted again at teardown to decide whether per-layer objects exist. */
50 hwrt->max_rts = args->layers;
52 /* Get pointers to the free lists */
53 for (i = 0; i < ARRAY_SIZE(hwrt->free_lists); i++) {
54 hwrt->free_lists[i] = pvr_free_list_lookup(pvr_file, args->free_list_handles[i]);
55 if (!hwrt->free_lists[i]) {
57 goto err_put_free_lists;
/* The local free list must already hold at least the device minimum number of pages. */
61 if (hwrt->free_lists[ROGUE_FW_LOCAL_FREELIST]->current_pages <
62 pvr_get_free_list_min_pages(pvr_dev)) {
64 goto err_put_free_lists;
/*
 * Unwind: every slot is put, including slots that were never successfully
 * looked up. NOTE(review): this assumes pvr_free_list_put() accepts NULL and
 * that @hwrt was zero-initialised by the caller - confirm.
 */
70 for (i = 0; i < ARRAY_SIZE(hwrt->free_lists); i++) {
71 pvr_free_list_put(hwrt->free_lists[i]);
72 hwrt->free_lists[i] = NULL;
/*
 * hwrt_fini_kernel_structure() - Undo hwrt_init_kernel_structure()
 * @hwrt: Dataset whose free list references are dropped.
 *
 * Puts every entry of hwrt->free_lists[] and resets the slot to NULL.
 */
79 hwrt_fini_kernel_structure(struct pvr_hwrt_dataset *hwrt)
83 for (i = 0; i < ARRAY_SIZE(hwrt->free_lists); i++) {
84 pvr_free_list_put(hwrt->free_lists[i]);
85 hwrt->free_lists[i] = NULL;
/*
 * hwrt_fini_common_fw_structure() - Undo hwrt_init_common_fw_structure()
 * @hwrt: Dataset whose common firmware object (common_fw_obj) is destroyed.
 */
90 hwrt_fini_common_fw_structure(struct pvr_hwrt_dataset *hwrt)
92 pvr_fw_object_destroy(hwrt->common_fw_obj);
/*
 * get_cr_isp_mtile_size_val() - Pack the ROGUE_CR_ISP_MTILE_SIZE X and Y fields
 * @pvr_dev: Device whose isp_samples_per_pixel feature value is queried.
 * @samples: Sample count supplied by the caller (args->samples).
 * @info: Macrotile information; mtile_x[0] and mtile_y[0] are the starting values.
 * @value_out: Receives the packed X/Y register fields.
 *
 * isp_samples_per_pixel values of 1, 2 and 4 are handled; any other value
 * triggers a WARN.
 */
96 get_cr_isp_mtile_size_val(struct pvr_device *pvr_dev, u32 samples,
97 struct pvr_rt_mtile_info *info, u32 *value_out)
99 u32 x = info->mtile_x[0];
100 u32 y = info->mtile_y[0];
101 u32 samples_per_pixel;
104 err = PVR_FEATURE_VALUE(pvr_dev, isp_samples_per_pixel, &samples_per_pixel);
/* Each branch adjusts x and/or y for the given samples-per-pixel capability before packing. */
108 if (samples_per_pixel == 1) {
113 } else if (samples_per_pixel == 2) {
118 } else if (samples_per_pixel == 4) {
122 WARN(true, "Unsupported ISP samples per pixel value");
/* Shift each value into its field, then mask so it cannot spill into neighbouring bits. */
126 *value_out = ((x << ROGUE_CR_ISP_MTILE_SIZE_X_SHIFT) & ~ROGUE_CR_ISP_MTILE_SIZE_X_CLRMSK) |
127 ((y << ROGUE_CR_ISP_MTILE_SIZE_Y_SHIFT) & ~ROGUE_CR_ISP_MTILE_SIZE_Y_CLRMSK);
/*
 * get_cr_multisamplectl_val() - Build a 64-bit multisample control value
 * @samples: Sample count; selects a row of the sample position table.
 * @y_flip: Requests the vertically flipped variant of the positions.
 * @value_out: Receives the packed value.
 *
 * The value holds eight byte-sized entries: the X position at bit i * 8 and
 * the Y position at bit i * 8 + 4.
 *
 * NOTE(review): the table row is fls(@samples) - 1, so a sample count that is
 * not a power of two selects the row of the next lower power of two (e.g. 3
 * uses the 2-sample row) rather than being rejected - confirm callers validate
 * @samples.
 */
133 get_cr_multisamplectl_val(u32 samples, bool y_flip, u64 *value_out)
135 static const struct {
138 } sample_positions[4] = {
151 .x = { 6, 14, 2, 10 },
152 .y = { 2, 6, 10, 14 },
156 .x = { 9, 7, 13, 5, 3, 1, 11, 15 },
157 .y = { 5, 11, 9, 3, 13, 7, 15, 1 },
160 const int idx = fls(samples) - 1;
/* idx < 0 means samples == 0; idx > 3 is beyond the four table rows. */
163 if (idx < 0 || idx > 3)
166 for (u32 i = 0; i < 8; i++) {
167 value |= ((u64)sample_positions[idx].x[i]) << (i * 8);
/* Flipped form: mirror Y as 16 - y, truncated to the 4-bit field (presumably the @y_flip case). */
169 value |= (((u64)(16 - sample_positions[idx].y[i]) & 0xf)) << (i * 8 + 4);
/* Unflipped form: Y position stored as-is. */
171 value |= ((u64)sample_positions[idx].y[i]) << (i * 8 + 4);
/*
 * get_cr_te_aa_val() - Accumulate ROGUE_CR_TE_AA_* enable flags
 * @pvr_dev: Device whose isp_samples_per_pixel feature value is queried.
 * @samples: Sample count supplied by the caller (args->samples).
 * @value_out: Output location; presumably receives the accumulated flags -
 *             TODO confirm.
 *
 * Switches on the device's isp_samples_per_pixel value and ORs together a
 * combination of the X, Y, X2 and Y2 enable flags. An unhandled
 * samples-per-pixel value triggers a WARN.
 */
180 get_cr_te_aa_val(struct pvr_device *pvr_dev, u32 samples, u32 *value_out)
182 u32 samples_per_pixel;
186 err = PVR_FEATURE_VALUE(pvr_dev, isp_samples_per_pixel, &samples_per_pixel);
190 switch (samples_per_pixel) {
193 value |= ROGUE_CR_TE_AA_Y_EN;
195 value |= ROGUE_CR_TE_AA_X_EN;
199 value |= ROGUE_CR_TE_AA_X2_EN;
201 value |= ROGUE_CR_TE_AA_Y_EN;
203 value |= ROGUE_CR_TE_AA_X_EN;
207 value |= ROGUE_CR_TE_AA_X2_EN;
209 value |= ROGUE_CR_TE_AA_Y2_EN;
211 value |= ROGUE_CR_TE_AA_Y_EN;
214 WARN(true, "Unsupported ISP samples per pixel value");
/*
 * hwrtdata_common_init() - Initialisation callback for the common firmware object
 * @cpu_ptr: Destination buffer for the new object.
 * @priv: The struct pvr_hwrt_dataset passed to pvr_fw_object_create().
 *
 * Copies the prepared hwrt->common structure into @cpu_ptr.
 */
224 hwrtdata_common_init(void *cpu_ptr, void *priv)
226 struct pvr_hwrt_dataset *hwrt = priv;
228 memcpy(cpu_ptr, &hwrt->common, sizeof(hwrt->common));
/*
 * hwrt_init_common_fw_structure() - Populate hwrt->common and create its firmware object
 * @pvr_file: File providing the device.
 * @args: Creation arguments (dimensions, samples, ISP merge values, geometry data).
 * @hwrt: Dataset whose common structure and common_fw_obj are set up.
 *
 * Derives the tile and macrotile layout from @args->width / @args->height and
 * the device's tile size, fills in the register values held in hwrt->common,
 * then creates the firmware object, which is initialised from hwrt->common by
 * hwrtdata_common_init().
 *
 * NOTE(review): @args->width and @args->height are used in "- 1" expressions
 * below; a zero value would wrap. Validation is not performed in this function
 * - confirm it happens in the caller.
 */
232 hwrt_init_common_fw_structure(struct pvr_file *pvr_file,
233 struct drm_pvr_ioctl_create_hwrt_dataset_args *args,
234 struct pvr_hwrt_dataset *hwrt)
236 struct drm_pvr_create_hwrt_geom_data_args *geom_data_args = &args->geom_data_args;
237 struct pvr_device *pvr_dev = pvr_file->pvr_dev;
238 struct pvr_rt_mtile_info info;
241 err = PVR_FEATURE_VALUE(pvr_dev, tile_size_x, &info.tile_size_x);
245 err = PVR_FEATURE_VALUE(pvr_dev, tile_size_y, &info.tile_size_y);
/* Number of tiles needed to cover the render target in each axis. */
249 info.num_tiles_x = DIV_ROUND_UP(args->width, info.tile_size_x);
250 info.num_tiles_y = DIV_ROUND_UP(args->height, info.tile_size_y);
/* Devices with the simple parameter format use a different macrotile layout. */
252 if (PVR_HAS_FEATURE(pvr_dev, simple_parameter_format_version)) {
253 u32 parameter_format;
255 err = PVR_FEATURE_VALUE(pvr_dev, simple_parameter_format_version,
/* Only version 2 is expected; other versions are flagged but not rejected on this line. */
260 WARN_ON(parameter_format != 2);
263 * Set up 16 macrotiles with a multiple of 2x2 tiles per macrotile, which is
264 * aligned to a tile group.
266 info.mtile_x[0] = DIV_ROUND_UP(info.num_tiles_x, 8) * 2;
267 info.mtile_y[0] = DIV_ROUND_UP(info.num_tiles_y, 8) * 2;
/* Maximum tile index, with the tile count rounded up to an even number first. */
272 info.tile_max_x = round_up(info.num_tiles_x, 2) - 1;
273 info.tile_max_y = round_up(info.num_tiles_y, 2) - 1;
275 /* Set up 16 macrotiles with a multiple of 4x4 tiles per macrotile. */
276 info.mtile_x[0] = round_up(DIV_ROUND_UP(info.num_tiles_x, 4), 4);
277 info.mtile_y[0] = round_up(DIV_ROUND_UP(info.num_tiles_y, 4), 4);
/* Entries [1] and [2] are two and three times the first macrotile size. */
278 info.mtile_x[1] = info.mtile_x[0] * 2;
279 info.mtile_y[1] = info.mtile_y[0] * 2;
280 info.mtile_x[2] = info.mtile_x[0] * 3;
281 info.mtile_y[2] = info.mtile_y[0] * 3;
282 info.tile_max_x = info.num_tiles_x - 1;
283 info.tile_max_y = info.num_tiles_y - 1;
286 hwrt->common.geom_caches_need_zeroing = false;
/* ISP merge parameters are passed through from userspace unchanged. */
288 hwrt->common.isp_merge_lower_x = args->isp_merge_lower_x;
289 hwrt->common.isp_merge_lower_y = args->isp_merge_lower_y;
290 hwrt->common.isp_merge_upper_x = args->isp_merge_upper_x;
291 hwrt->common.isp_merge_upper_y = args->isp_merge_upper_y;
292 hwrt->common.isp_merge_scale_x = args->isp_merge_scale_x;
293 hwrt->common.isp_merge_scale_y = args->isp_merge_scale_y;
/* Both the normal and the Y-flipped multisample control values are precomputed. */
295 err = get_cr_multisamplectl_val(args->samples, false,
296 &hwrt->common.multi_sample_ctl);
300 err = get_cr_multisamplectl_val(args->samples, true,
301 &hwrt->common.flipped_multi_sample_ctl);
305 hwrt->common.mtile_stride = info.mtile_x[0] * info.mtile_y[0];
307 err = get_cr_te_aa_val(pvr_dev, args->samples, &hwrt->common.teaa);
/* Maximum pixel coordinates (width - 1, height - 1) packed into their register fields. */
311 hwrt->common.screen_pixel_max =
312 (((args->width - 1) << ROGUE_CR_PPP_SCREEN_PIXXMAX_SHIFT) &
313 ~ROGUE_CR_PPP_SCREEN_PIXXMAX_CLRMSK) |
314 (((args->height - 1) << ROGUE_CR_PPP_SCREEN_PIXYMAX_SHIFT) &
315 ~ROGUE_CR_PPP_SCREEN_PIXYMAX_CLRMSK);
/* Maximum tile indices packed into the TE_SCREEN fields. */
317 hwrt->common.te_screen =
318 ((info.tile_max_x << ROGUE_CR_TE_SCREEN_XMAX_SHIFT) &
319 ~ROGUE_CR_TE_SCREEN_XMAX_CLRMSK) |
320 ((info.tile_max_y << ROGUE_CR_TE_SCREEN_YMAX_SHIFT) &
321 ~ROGUE_CR_TE_SCREEN_YMAX_CLRMSK);
/* The three macrotile X values go into TE_MTILE1, the three Y values into TE_MTILE2. */
322 hwrt->common.te_mtile1 =
323 ((info.mtile_x[0] << ROGUE_CR_TE_MTILE1_X1_SHIFT) & ~ROGUE_CR_TE_MTILE1_X1_CLRMSK) |
324 ((info.mtile_x[1] << ROGUE_CR_TE_MTILE1_X2_SHIFT) & ~ROGUE_CR_TE_MTILE1_X2_CLRMSK) |
325 ((info.mtile_x[2] << ROGUE_CR_TE_MTILE1_X3_SHIFT) & ~ROGUE_CR_TE_MTILE1_X3_CLRMSK);
326 hwrt->common.te_mtile2 =
327 ((info.mtile_y[0] << ROGUE_CR_TE_MTILE2_Y1_SHIFT) & ~ROGUE_CR_TE_MTILE2_Y1_CLRMSK) |
328 ((info.mtile_y[1] << ROGUE_CR_TE_MTILE2_Y2_SHIFT) & ~ROGUE_CR_TE_MTILE2_Y2_CLRMSK) |
329 ((info.mtile_y[2] << ROGUE_CR_TE_MTILE2_Y3_SHIFT) & ~ROGUE_CR_TE_MTILE2_Y3_CLRMSK);
331 err = get_cr_isp_mtile_size_val(pvr_dev, args->samples, &info,
332 &hwrt->common.isp_mtile_size);
336 hwrt->common.tpc_stride = geom_data_args->tpc_stride;
337 hwrt->common.tpc_size = geom_data_args->tpc_size;
339 hwrt->common.rgn_header_size = args->region_header_size;
/* hwrtdata_common_init() copies hwrt->common into the newly created object. */
341 err = pvr_fw_object_create(pvr_dev, sizeof(struct rogue_fwif_hwrtdata_common),
342 PVR_BO_FW_FLAGS_DEVICE_UNCACHED, hwrtdata_common_init, hwrt,
343 &hwrt->common_fw_obj);
/*
 * hwrt_fw_data_init() - Initialisation callback for a per-RT-data firmware object
 * @cpu_ptr: Destination buffer for the new object.
 * @priv: The struct pvr_hwrt_data passed to pvr_fw_object_create().
 *
 * Copies the prepared hwrt_data->data structure into @cpu_ptr.
 */
349 hwrt_fw_data_init(void *cpu_ptr, void *priv)
351 struct pvr_hwrt_data *hwrt_data = priv;
353 memcpy(cpu_ptr, &hwrt_data->data, sizeof(hwrt_data->data));
/*
 * hwrt_data_init_fw_structure() - Populate one HWRT data entry and create its firmware objects
 * @pvr_file: File providing the device.
 * @hwrt: Owning dataset; supplies the common firmware object and the free lists.
 * @args: Creation arguments (layers and geometry data).
 * @rt_data_args: Per-RT-data device addresses supplied by userspace.
 * @hwrt_data: Entry to initialise.
 *
 * Fills hwrt_data->data with firmware and device addresses. When more than
 * one layer is requested, it also creates the SRTC and RAA objects (one entry
 * per layer) and records their firmware addresses in rta_ctl. Finally it
 * creates the firmware object, which is initialised from hwrt_data->data by
 * hwrt_fw_data_init(), and registers @hwrt_data with the first free list.
 */
357 hwrt_data_init_fw_structure(struct pvr_file *pvr_file,
358 struct pvr_hwrt_dataset *hwrt,
359 struct drm_pvr_ioctl_create_hwrt_dataset_args *args,
360 struct drm_pvr_create_hwrt_rt_data_args *rt_data_args,
361 struct pvr_hwrt_data *hwrt_data)
363 struct drm_pvr_create_hwrt_geom_data_args *geom_data_args = &args->geom_data_args;
364 struct pvr_device *pvr_dev = pvr_file->pvr_dev;
365 struct rogue_fwif_rta_ctl *rta_ctl;
/* Link this entry to the dataset-wide common structure and to each free list. */
369 pvr_fw_object_get_fw_addr(hwrt->common_fw_obj,
370 &hwrt_data->data.hwrt_data_common_fw_addr);
372 for (free_list_i = 0; free_list_i < ARRAY_SIZE(hwrt->free_lists); free_list_i++) {
373 pvr_fw_object_get_fw_addr(hwrt->free_lists[free_list_i]->fw_obj,
374 &hwrt_data->data.freelists_fw_addr[free_list_i]);
/* Geometry data addresses come from the shared geom_data_args. */
377 hwrt_data->data.tail_ptrs_dev_addr = geom_data_args->tpc_dev_addr;
378 hwrt_data->data.vheap_table_dev_addr = geom_data_args->vheap_table_dev_addr;
379 hwrt_data->data.rtc_dev_addr = geom_data_args->rtc_dev_addr;
/* These addresses are specific to this RT data entry. */
381 hwrt_data->data.pm_mlist_dev_addr = rt_data_args->pm_mlist_dev_addr;
382 hwrt_data->data.macrotile_array_dev_addr = rt_data_args->macrotile_array_dev_addr;
383 hwrt_data->data.rgn_header_dev_addr = rt_data_args->region_header_dev_addr;
385 rta_ctl = &hwrt_data->data.rta_ctl;
/* Defaults for the single-layer case; the two addresses are overwritten below when layers > 1. */
387 rta_ctl->render_target_index = 0;
388 rta_ctl->active_render_targets = 0;
389 rta_ctl->valid_render_targets_fw_addr = 0;
390 rta_ctl->rta_num_partial_renders_fw_addr = 0;
391 rta_ctl->max_rts = args->layers;
393 if (args->layers > 1) {
/* No init callback is supplied for the SRTC and RAA objects. */
394 err = pvr_fw_object_create(pvr_dev, args->layers * SRTC_ENTRY_SIZE,
395 PVR_BO_FW_FLAGS_DEVICE_UNCACHED,
396 NULL, NULL, &hwrt_data->srtc_obj);
399 pvr_fw_object_get_fw_addr(hwrt_data->srtc_obj,
400 &rta_ctl->valid_render_targets_fw_addr);
402 err = pvr_fw_object_create(pvr_dev, args->layers * RAA_ENTRY_SIZE,
403 PVR_BO_FW_FLAGS_DEVICE_UNCACHED,
404 NULL, NULL, &hwrt_data->raa_obj);
406 goto err_put_shadow_rt_cache;
407 pvr_fw_object_get_fw_addr(hwrt_data->raa_obj,
408 &rta_ctl->rta_num_partial_renders_fw_addr);
/* Created last so hwrt_fw_data_init() copies the fully populated hwrt_data->data. */
411 err = pvr_fw_object_create(pvr_dev, sizeof(struct rogue_fwif_hwrtdata),
412 PVR_BO_FW_FLAGS_DEVICE_UNCACHED,
413 hwrt_fw_data_init, hwrt_data, &hwrt_data->fw_obj);
415 goto err_put_raa_obj;
417 pvr_free_list_add_hwrt(hwrt->free_lists[0], hwrt_data);
/* Unwind in reverse creation order; the per-layer objects only exist when layers > 1. */
422 if (args->layers > 1)
423 pvr_fw_object_destroy(hwrt_data->raa_obj);
425 err_put_shadow_rt_cache:
426 if (args->layers > 1)
427 pvr_fw_object_destroy(hwrt_data->srtc_obj);
/*
 * hwrt_data_fini_fw_structure() - Undo hwrt_data_init_fw_structure() for one entry
 * @hwrt: Owning dataset.
 * @hwrt_nr: Index into hwrt->data[] of the entry to tear down.
 *
 * Unregisters the entry from the first free list, destroys the RAA and SRTC
 * objects when the dataset has more than one render target, then destroys the
 * entry's firmware object.
 */
433 hwrt_data_fini_fw_structure(struct pvr_hwrt_dataset *hwrt, int hwrt_nr)
435 struct pvr_hwrt_data *hwrt_data = &hwrt->data[hwrt_nr];
437 pvr_free_list_remove_hwrt(hwrt->free_lists[0], hwrt_data);
/* max_rts was set from args->layers, matching the layers > 1 condition used at creation. */
439 if (hwrt->max_rts > 1) {
440 pvr_fw_object_destroy(hwrt_data->raa_obj);
441 pvr_fw_object_destroy(hwrt_data->srtc_obj);
444 pvr_fw_object_destroy(hwrt_data->fw_obj);
448 * pvr_hwrt_dataset_create() - Create a new HWRT dataset
449 * @pvr_file: Pointer to pvr_file structure.
450 * @args: Creation arguments from userspace.
453 * * Pointer to new HWRT, or
454 * * ERR_PTR(-%ENOMEM) on out of memory.
456 struct pvr_hwrt_dataset *
457 pvr_hwrt_dataset_create(struct pvr_file *pvr_file,
458 struct drm_pvr_ioctl_create_hwrt_dataset_args *args)
460 struct pvr_hwrt_dataset *hwrt;
463 /* Create and fill out the kernel structure */
464 hwrt = kzalloc(sizeof(*hwrt), GFP_KERNEL);
467 return ERR_PTR(-ENOMEM);
469 err = hwrt_init_kernel_structure(pvr_file, args, hwrt);
473 err = hwrt_init_common_fw_structure(pvr_file, args, hwrt);
475 goto err_fini_kernel_structure;
477 for (; i < ARRAY_SIZE(hwrt->data); i++) {
478 err = hwrt_data_init_fw_structure(pvr_file, hwrt, args,
479 &args->rt_data_args[i],
482 goto err_fini_data_structures;
484 hwrt->data[i].hwrt_dataset = hwrt;
487 kref_init(&hwrt->ref_count);
490 err_fini_data_structures:
492 hwrt_data_fini_fw_structure(hwrt, i);
494 err_fini_kernel_structure:
495 hwrt_fini_kernel_structure(hwrt);
/*
 * pvr_hwrt_dataset_release() - kref release callback for a HWRT dataset
 * @ref_count: The ref_count member embedded in the dataset being released.
 *
 * Tears the dataset down in the reverse order of creation: each hwrt->data[]
 * entry (highest index first), then the common firmware structure, then the
 * kernel structure.
 */
504 pvr_hwrt_dataset_release(struct kref *ref_count)
506 struct pvr_hwrt_dataset *hwrt =
507 container_of(ref_count, struct pvr_hwrt_dataset, ref_count);
509 for (int i = ARRAY_SIZE(hwrt->data) - 1; i >= 0; i--) {
/*
 * pvr_fw_structure_cleanup() is called with ROGUE_FWIF_CLEANUP_HWRTDATA for
 * each entry before it is destroyed; a non-zero result only triggers WARN_ON
 * and teardown continues regardless.
 */
510 WARN_ON(pvr_fw_structure_cleanup(hwrt->pvr_dev, ROGUE_FWIF_CLEANUP_HWRTDATA,
511 hwrt->data[i].fw_obj, 0));
512 hwrt_data_fini_fw_structure(hwrt, i);
515 hwrt_fini_common_fw_structure(hwrt);
516 hwrt_fini_kernel_structure(hwrt);
522 * pvr_destroy_hwrt_datasets_for_file() - Destroy any HWRT datasets associated
523 * with the given file.
524 * @pvr_file: Pointer to pvr_file structure.
526 * Removes all HWRT datasets associated with @pvr_file from the file's
527 * hwrt_handles xarray and drops initial references. HWRT datasets will then be
528 * destroyed once all outstanding references are dropped.
530 void pvr_destroy_hwrt_datasets_for_file(struct pvr_file *pvr_file)
532 struct pvr_hwrt_dataset *hwrt;
533 unsigned long handle;
/* Walk every handle still present in this file's hwrt_handles xarray. */
535 xa_for_each(&pvr_file->hwrt_handles, handle, hwrt) {
/* Erase the handle and drop a reference on whatever entry xa_erase() returns. */
537 pvr_hwrt_dataset_put(xa_erase(&pvr_file->hwrt_handles, handle));
542 * pvr_hwrt_dataset_put() - Release reference on HWRT dataset
543 * @hwrt: Pointer to HWRT dataset to release reference on
546 pvr_hwrt_dataset_put(struct pvr_hwrt_dataset *hwrt)
/* Dropping the last reference invokes pvr_hwrt_dataset_release(), which tears the dataset down. */
549 kref_put(&hwrt->ref_count, pvr_hwrt_dataset_release);