rga-hw.c (11453B)
1// SPDX-License-Identifier: GPL-2.0-only 2/* 3 * Copyright (C) Fuzhou Rockchip Electronics Co.Ltd 4 * Author: Jacob Chen <jacob-chen@iotwrt.com> 5 */ 6 7#include <linux/pm_runtime.h> 8 9#include "rga-hw.h" 10#include "rga.h" 11 12enum e_rga_start_pos { 13 LT = 0, 14 LB = 1, 15 RT = 2, 16 RB = 3, 17}; 18 19struct rga_addr_offset { 20 unsigned int y_off; 21 unsigned int u_off; 22 unsigned int v_off; 23}; 24 25struct rga_corners_addr_offset { 26 struct rga_addr_offset left_top; 27 struct rga_addr_offset right_top; 28 struct rga_addr_offset left_bottom; 29 struct rga_addr_offset right_bottom; 30}; 31 32static unsigned int rga_get_scaling(unsigned int src, unsigned int dst) 33{ 34 /* 35 * The rga hw scaling factor is a normalized inverse of the 36 * scaling factor. 37 * For example: When source width is 100 and destination width is 200 38 * (scaling of 2x), then the hw factor is NC * 100 / 200. 39 * The normalization factor (NC) is 2^16 = 0x10000. 40 */ 41 42 return (src > dst) ? ((dst << 16) / src) : ((src << 16) / dst); 43} 44 45static struct rga_corners_addr_offset 46rga_get_addr_offset(struct rga_frame *frm, unsigned int x, unsigned int y, 47 unsigned int w, unsigned int h) 48{ 49 struct rga_corners_addr_offset offsets; 50 struct rga_addr_offset *lt, *lb, *rt, *rb; 51 unsigned int x_div = 0, 52 y_div = 0, uv_stride = 0, pixel_width = 0, uv_factor = 0; 53 54 lt = &offsets.left_top; 55 lb = &offsets.left_bottom; 56 rt = &offsets.right_top; 57 rb = &offsets.right_bottom; 58 59 x_div = frm->fmt->x_div; 60 y_div = frm->fmt->y_div; 61 uv_factor = frm->fmt->uv_factor; 62 uv_stride = frm->stride / x_div; 63 pixel_width = frm->stride / frm->width; 64 65 lt->y_off = y * frm->stride + x * pixel_width; 66 lt->u_off = 67 frm->width * frm->height + (y / y_div) * uv_stride + x / x_div; 68 lt->v_off = lt->u_off + frm->width * frm->height / uv_factor; 69 70 lb->y_off = lt->y_off + (h - 1) * frm->stride; 71 lb->u_off = lt->u_off + (h / y_div - 1) * uv_stride; 72 lb->v_off = lt->v_off + (h / y_div - 1) * uv_stride; 73 74 rt->y_off = lt->y_off + (w - 1) * pixel_width; 75 rt->u_off = lt->u_off + w / x_div - 1; 76 rt->v_off = lt->v_off + w / x_div - 1; 77 78 rb->y_off = lb->y_off + (w - 1) * pixel_width; 79 rb->u_off = lb->u_off + w / x_div - 1; 80 rb->v_off = lb->v_off + w / x_div - 1; 81 82 return offsets; 83} 84 85static struct rga_addr_offset *rga_lookup_draw_pos(struct 86 rga_corners_addr_offset 87 * offsets, u32 rotate_mode, 88 u32 mirr_mode) 89{ 90 static enum e_rga_start_pos rot_mir_point_matrix[4][4] = { 91 { 92 LT, RT, LB, RB, 93 }, 94 { 95 RT, LT, RB, LB, 96 }, 97 { 98 RB, LB, RT, LT, 99 }, 100 { 101 LB, RB, LT, RT, 102 }, 103 }; 104 105 if (!offsets) 106 return NULL; 107 108 switch (rot_mir_point_matrix[rotate_mode][mirr_mode]) { 109 case LT: 110 return &offsets->left_top; 111 case LB: 112 return &offsets->left_bottom; 113 case RT: 114 return &offsets->right_top; 115 case RB: 116 return &offsets->right_bottom; 117 } 118 119 return NULL; 120} 121 122static void rga_cmd_set_src_addr(struct rga_ctx *ctx, void *mmu_pages) 123{ 124 struct rockchip_rga *rga = ctx->rga; 125 u32 *dest = rga->cmdbuf_virt; 126 unsigned int reg; 127 128 reg = RGA_MMU_SRC_BASE - RGA_MODE_BASE_REG; 129 dest[reg >> 2] = virt_to_phys(mmu_pages) >> 4; 130 131 reg = RGA_MMU_CTRL1 - RGA_MODE_BASE_REG; 132 dest[reg >> 2] |= 0x7; 133} 134 135static void rga_cmd_set_src1_addr(struct rga_ctx *ctx, void *mmu_pages) 136{ 137 struct rockchip_rga *rga = ctx->rga; 138 u32 *dest = rga->cmdbuf_virt; 139 unsigned int reg; 140 141 reg = RGA_MMU_SRC1_BASE - RGA_MODE_BASE_REG; 142 dest[reg >> 2] = virt_to_phys(mmu_pages) >> 4; 143 144 reg = RGA_MMU_CTRL1 - RGA_MODE_BASE_REG; 145 dest[reg >> 2] |= 0x7 << 4; 146} 147 148static void rga_cmd_set_dst_addr(struct rga_ctx *ctx, void *mmu_pages) 149{ 150 struct rockchip_rga *rga = ctx->rga; 151 u32 *dest = rga->cmdbuf_virt; 152 unsigned int reg; 153 154 reg = RGA_MMU_DST_BASE - RGA_MODE_BASE_REG; 155 dest[reg >> 2] = virt_to_phys(mmu_pages) >> 4; 156 157 reg = RGA_MMU_CTRL1 - RGA_MODE_BASE_REG; 158 dest[reg >> 2] |= 0x7 << 8; 159} 160 161static void rga_cmd_set_trans_info(struct rga_ctx *ctx) 162{ 163 struct rockchip_rga *rga = ctx->rga; 164 u32 *dest = rga->cmdbuf_virt; 165 unsigned int scale_dst_w, scale_dst_h; 166 unsigned int src_h, src_w, src_x, src_y, dst_h, dst_w, dst_x, dst_y; 167 union rga_src_info src_info; 168 union rga_dst_info dst_info; 169 union rga_src_x_factor x_factor; 170 union rga_src_y_factor y_factor; 171 union rga_src_vir_info src_vir_info; 172 union rga_src_act_info src_act_info; 173 union rga_dst_vir_info dst_vir_info; 174 union rga_dst_act_info dst_act_info; 175 176 struct rga_addr_offset *dst_offset; 177 struct rga_corners_addr_offset offsets; 178 struct rga_corners_addr_offset src_offsets; 179 180 src_h = ctx->in.crop.height; 181 src_w = ctx->in.crop.width; 182 src_x = ctx->in.crop.left; 183 src_y = ctx->in.crop.top; 184 dst_h = ctx->out.crop.height; 185 dst_w = ctx->out.crop.width; 186 dst_x = ctx->out.crop.left; 187 dst_y = ctx->out.crop.top; 188 189 src_info.val = dest[(RGA_SRC_INFO - RGA_MODE_BASE_REG) >> 2]; 190 dst_info.val = dest[(RGA_DST_INFO - RGA_MODE_BASE_REG) >> 2]; 191 x_factor.val = dest[(RGA_SRC_X_FACTOR - RGA_MODE_BASE_REG) >> 2]; 192 y_factor.val = dest[(RGA_SRC_Y_FACTOR - RGA_MODE_BASE_REG) >> 2]; 193 src_vir_info.val = dest[(RGA_SRC_VIR_INFO - RGA_MODE_BASE_REG) >> 2]; 194 src_act_info.val = dest[(RGA_SRC_ACT_INFO - RGA_MODE_BASE_REG) >> 2]; 195 dst_vir_info.val = dest[(RGA_DST_VIR_INFO - RGA_MODE_BASE_REG) >> 2]; 196 dst_act_info.val = dest[(RGA_DST_ACT_INFO - RGA_MODE_BASE_REG) >> 2]; 197 198 src_info.data.format = ctx->in.fmt->hw_format; 199 src_info.data.swap = ctx->in.fmt->color_swap; 200 dst_info.data.format = ctx->out.fmt->hw_format; 201 dst_info.data.swap = ctx->out.fmt->color_swap; 202 203 /* 204 * CSC mode must only be set when the colorspace families differ between 205 * input and output. It must remain unset (zeroed) if both are the same. 206 */ 207 208 if (RGA_COLOR_FMT_IS_YUV(ctx->in.fmt->hw_format) && 209 RGA_COLOR_FMT_IS_RGB(ctx->out.fmt->hw_format)) { 210 switch (ctx->in.colorspace) { 211 case V4L2_COLORSPACE_REC709: 212 src_info.data.csc_mode = RGA_SRC_CSC_MODE_BT709_R0; 213 break; 214 default: 215 src_info.data.csc_mode = RGA_SRC_CSC_MODE_BT601_R0; 216 break; 217 } 218 } 219 220 if (RGA_COLOR_FMT_IS_RGB(ctx->in.fmt->hw_format) && 221 RGA_COLOR_FMT_IS_YUV(ctx->out.fmt->hw_format)) { 222 switch (ctx->out.colorspace) { 223 case V4L2_COLORSPACE_REC709: 224 dst_info.data.csc_mode = RGA_SRC_CSC_MODE_BT709_R0; 225 break; 226 default: 227 dst_info.data.csc_mode = RGA_DST_CSC_MODE_BT601_R0; 228 break; 229 } 230 } 231 232 if (ctx->vflip) 233 src_info.data.mir_mode |= RGA_SRC_MIRR_MODE_X; 234 235 if (ctx->hflip) 236 src_info.data.mir_mode |= RGA_SRC_MIRR_MODE_Y; 237 238 switch (ctx->rotate) { 239 case 90: 240 src_info.data.rot_mode = RGA_SRC_ROT_MODE_90_DEGREE; 241 break; 242 case 180: 243 src_info.data.rot_mode = RGA_SRC_ROT_MODE_180_DEGREE; 244 break; 245 case 270: 246 src_info.data.rot_mode = RGA_SRC_ROT_MODE_270_DEGREE; 247 break; 248 default: 249 src_info.data.rot_mode = RGA_SRC_ROT_MODE_0_DEGREE; 250 break; 251 } 252 253 /* 254 * Calculate the up/down scaling mode/factor. 255 * 256 * RGA used to scale the picture first, and then rotate second, 257 * so we need to swap the w/h when rotate degree is 90/270. 258 */ 259 if (src_info.data.rot_mode == RGA_SRC_ROT_MODE_90_DEGREE || 260 src_info.data.rot_mode == RGA_SRC_ROT_MODE_270_DEGREE) { 261 if (rga->version.major == 0 || rga->version.minor == 0) { 262 if (dst_w == src_h) 263 src_h -= 8; 264 if (abs(src_w - dst_h) < 16) 265 src_w -= 16; 266 } 267 268 scale_dst_h = dst_w; 269 scale_dst_w = dst_h; 270 } else { 271 scale_dst_w = dst_w; 272 scale_dst_h = dst_h; 273 } 274 275 if (src_w == scale_dst_w) { 276 src_info.data.hscl_mode = RGA_SRC_HSCL_MODE_NO; 277 x_factor.val = 0; 278 } else if (src_w > scale_dst_w) { 279 src_info.data.hscl_mode = RGA_SRC_HSCL_MODE_DOWN; 280 x_factor.data.down_scale_factor = 281 rga_get_scaling(src_w, scale_dst_w) + 1; 282 } else { 283 src_info.data.hscl_mode = RGA_SRC_HSCL_MODE_UP; 284 x_factor.data.up_scale_factor = 285 rga_get_scaling(src_w - 1, scale_dst_w - 1); 286 } 287 288 if (src_h == scale_dst_h) { 289 src_info.data.vscl_mode = RGA_SRC_VSCL_MODE_NO; 290 y_factor.val = 0; 291 } else if (src_h > scale_dst_h) { 292 src_info.data.vscl_mode = RGA_SRC_VSCL_MODE_DOWN; 293 y_factor.data.down_scale_factor = 294 rga_get_scaling(src_h, scale_dst_h) + 1; 295 } else { 296 src_info.data.vscl_mode = RGA_SRC_VSCL_MODE_UP; 297 y_factor.data.up_scale_factor = 298 rga_get_scaling(src_h - 1, scale_dst_h - 1); 299 } 300 301 /* 302 * Calculate the framebuffer virtual strides and active size, 303 * note that the step of vir_stride / vir_width is 4 byte words 304 */ 305 src_vir_info.data.vir_stride = ctx->in.stride >> 2; 306 src_vir_info.data.vir_width = ctx->in.stride >> 2; 307 308 src_act_info.data.act_height = src_h - 1; 309 src_act_info.data.act_width = src_w - 1; 310 311 dst_vir_info.data.vir_stride = ctx->out.stride >> 2; 312 dst_act_info.data.act_height = dst_h - 1; 313 dst_act_info.data.act_width = dst_w - 1; 314 315 /* 316 * Calculate the source framebuffer base address with offset pixel. 317 */ 318 src_offsets = rga_get_addr_offset(&ctx->in, src_x, src_y, 319 src_w, src_h); 320 321 /* 322 * Configure the dest framebuffer base address with pixel offset. 323 */ 324 offsets = rga_get_addr_offset(&ctx->out, dst_x, dst_y, dst_w, dst_h); 325 dst_offset = rga_lookup_draw_pos(&offsets, src_info.data.rot_mode, 326 src_info.data.mir_mode); 327 328 dest[(RGA_SRC_Y_RGB_BASE_ADDR - RGA_MODE_BASE_REG) >> 2] = 329 src_offsets.left_top.y_off; 330 dest[(RGA_SRC_CB_BASE_ADDR - RGA_MODE_BASE_REG) >> 2] = 331 src_offsets.left_top.u_off; 332 dest[(RGA_SRC_CR_BASE_ADDR - RGA_MODE_BASE_REG) >> 2] = 333 src_offsets.left_top.v_off; 334 335 dest[(RGA_SRC_X_FACTOR - RGA_MODE_BASE_REG) >> 2] = x_factor.val; 336 dest[(RGA_SRC_Y_FACTOR - RGA_MODE_BASE_REG) >> 2] = y_factor.val; 337 dest[(RGA_SRC_VIR_INFO - RGA_MODE_BASE_REG) >> 2] = src_vir_info.val; 338 dest[(RGA_SRC_ACT_INFO - RGA_MODE_BASE_REG) >> 2] = src_act_info.val; 339 340 dest[(RGA_SRC_INFO - RGA_MODE_BASE_REG) >> 2] = src_info.val; 341 342 dest[(RGA_DST_Y_RGB_BASE_ADDR - RGA_MODE_BASE_REG) >> 2] = 343 dst_offset->y_off; 344 dest[(RGA_DST_CB_BASE_ADDR - RGA_MODE_BASE_REG) >> 2] = 345 dst_offset->u_off; 346 dest[(RGA_DST_CR_BASE_ADDR - RGA_MODE_BASE_REG) >> 2] = 347 dst_offset->v_off; 348 349 dest[(RGA_DST_VIR_INFO - RGA_MODE_BASE_REG) >> 2] = dst_vir_info.val; 350 dest[(RGA_DST_ACT_INFO - RGA_MODE_BASE_REG) >> 2] = dst_act_info.val; 351 352 dest[(RGA_DST_INFO - RGA_MODE_BASE_REG) >> 2] = dst_info.val; 353} 354 355static void rga_cmd_set_mode(struct rga_ctx *ctx) 356{ 357 struct rockchip_rga *rga = ctx->rga; 358 u32 *dest = rga->cmdbuf_virt; 359 union rga_mode_ctrl mode; 360 union rga_alpha_ctrl0 alpha_ctrl0; 361 union rga_alpha_ctrl1 alpha_ctrl1; 362 363 mode.val = 0; 364 alpha_ctrl0.val = 0; 365 alpha_ctrl1.val = 0; 366 367 mode.data.gradient_sat = 1; 368 mode.data.render = RGA_MODE_RENDER_BITBLT; 369 mode.data.bitblt = RGA_MODE_BITBLT_MODE_SRC_TO_DST; 370 371 /* disable alpha blending */ 372 dest[(RGA_ALPHA_CTRL0 - RGA_MODE_BASE_REG) >> 2] = alpha_ctrl0.val; 373 dest[(RGA_ALPHA_CTRL1 - RGA_MODE_BASE_REG) >> 2] = alpha_ctrl1.val; 374 375 dest[(RGA_MODE_CTRL - RGA_MODE_BASE_REG) >> 2] = mode.val; 376} 377 378static void rga_cmd_set(struct rga_ctx *ctx) 379{ 380 struct rockchip_rga *rga = ctx->rga; 381 382 memset(rga->cmdbuf_virt, 0, RGA_CMDBUF_SIZE * 4); 383 384 rga_cmd_set_src_addr(ctx, rga->src_mmu_pages); 385 /* 386 * Due to hardware bug, 387 * src1 mmu also should be configured when using alpha blending. 388 */ 389 rga_cmd_set_src1_addr(ctx, rga->dst_mmu_pages); 390 391 rga_cmd_set_dst_addr(ctx, rga->dst_mmu_pages); 392 rga_cmd_set_mode(ctx); 393 394 rga_cmd_set_trans_info(ctx); 395 396 rga_write(rga, RGA_CMD_BASE, rga->cmdbuf_phy); 397 398 /* sync CMD buf for RGA */ 399 dma_sync_single_for_device(rga->dev, rga->cmdbuf_phy, 400 PAGE_SIZE, DMA_BIDIRECTIONAL); 401} 402 403void rga_hw_start(struct rockchip_rga *rga) 404{ 405 struct rga_ctx *ctx = rga->curr; 406 407 rga_cmd_set(ctx); 408 409 rga_write(rga, RGA_SYS_CTRL, 0x00); 410 411 rga_write(rga, RGA_SYS_CTRL, 0x22); 412 413 rga_write(rga, RGA_INT, 0x600); 414 415 rga_write(rga, RGA_CMD_CTRL, 0x1); 416}