hfi_buffer_iris2.h 56 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543
  1. /* SPDX-License-Identifier: GPL-2.0-only */
  2. /*
  3. * Copyright (c) 2020-2021, The Linux Foundation. All rights reserved.
  4. */
  5. #ifndef __HFI_BUFFER_IRIS2__
  6. #define __HFI_BUFFER_IRIS2__
  7. #include <linux/types.h>
  8. #include "hfi_property.h"
  9. typedef u8 HFI_U8;
  10. typedef s8 HFI_S8;
  11. typedef u16 HFI_U16;
  12. typedef s16 HFI_S16;
  13. typedef u32 HFI_U32;
  14. typedef s32 HFI_S32;
  15. typedef u64 HFI_U64;
  16. typedef HFI_U32 HFI_BOOL;
  17. #ifndef MIN
  18. #define MIN(x, y) (((x) < (y)) ? (x) : (y))
  19. #endif
  20. #ifndef MAX
  21. #define MAX(x, y) (((x) > (y)) ? (x) : (y))
  22. #endif
  23. #define HFI_ALIGNMENT_4096 (4096)
  24. #define BUF_SIZE_ALIGN_16 (16)
  25. #define BUF_SIZE_ALIGN_32 (32)
  26. #define BUF_SIZE_ALIGN_64 (64)
  27. #define BUF_SIZE_ALIGN_128 (128)
  28. #define BUF_SIZE_ALIGN_256 (256)
  29. #define BUF_SIZE_ALIGN_512 (512)
  30. #define BUF_SIZE_ALIGN_4096 (4096)
  31. #define HFI_ALIGN(a, b) (((b) & ((b) - 1)) ? (((a) + (b) - 1) / \
  32. (b) * (b)) : (((a) + (b) - 1) & (~((b) - 1))))
  33. #define HFI_WORKMODE_1 1
  34. #define HFI_WORKMODE_2 2
  35. #define HFI_DEFAULT_METADATA_STRIDE_MULTIPLE (64)
  36. #define HFI_DEFAULT_METADATA_BUFFERHEIGHT_MULTIPLE (16)
  37. #define HFI_COLOR_FORMAT_YUV420_NV12_UBWC_Y_TILE_HEIGHT (8)
  38. #define HFI_COLOR_FORMAT_YUV420_NV12_UBWC_Y_TILE_WIDTH (32)
  39. #define HFI_COLOR_FORMAT_YUV420_NV12_UBWC_UV_TILE_HEIGHT (8)
  40. #define HFI_COLOR_FORMAT_YUV420_NV12_UBWC_UV_TILE_WIDTH (16)
  41. #define HFI_COLOR_FORMAT_YUV420_TP10_UBWC_Y_TILE_HEIGHT (4)
  42. #define HFI_COLOR_FORMAT_YUV420_TP10_UBWC_Y_TILE_WIDTH (48)
  43. #define HFI_COLOR_FORMAT_YUV420_TP10_UBWC_UV_TILE_HEIGHT (4)
  44. #define HFI_COLOR_FORMAT_YUV420_TP10_UBWC_UV_TILE_WIDTH (24)
  45. #define HFI_COLOR_FORMAT_RGBA8888_UBWC_TILE_HEIGHT (4)
  46. #define HFI_COLOR_FORMAT_RGBA8888_UBWC_TILE_WIDTH (16)
  47. #define HFI_NV12_IL_CALC_Y_STRIDE(stride, frame_width, stride_multiple) \
  48. stride = HFI_ALIGN(frame_width, stride_multiple)
  49. #define HFI_NV12_IL_CALC_Y_BUFHEIGHT(buf_height, frame_height, \
  50. min_buf_height_multiple) buf_height = HFI_ALIGN(frame_height, \
  51. min_buf_height_multiple)
  52. #define HFI_NV12_IL_CALC_UV_STRIDE(stride, frame_width, stride_multiple) \
  53. stride = HFI_ALIGN(frame_width, stride_multiple)
  54. #define HFI_NV12_IL_CALC_UV_BUFHEIGHT(buf_height, frame_height, \
  55. min_buf_height_multiple) buf_height = HFI_ALIGN(((frame_height + 1) \
  56. >> 1), min_buf_height_multiple)
  57. #define HFI_NV12_IL_CALC_BUF_SIZE(buf_size, y_bufSize, y_stride, y_buf_height, \
  58. uv_buf_size, uv_stride, uv_buf_height) \
  59. y_bufSize = (y_stride * y_buf_height); \
  60. uv_buf_size = (uv_stride * uv_buf_height); \
  61. buf_size = HFI_ALIGN(y_bufSize + uv_buf_size, HFI_ALIGNMENT_4096)
  62. #define HFI_NV12_UBWC_IL_CALC_Y_BUF_SIZE(y_bufSize, y_stride, y_buf_height) \
  63. y_bufSize = HFI_ALIGN(y_stride * y_buf_height, HFI_ALIGNMENT_4096)
  64. #define HFI_NV12_UBWC_IL_CALC_UV_BUF_SIZE(uv_buf_size, \
  65. uv_stride, uv_buf_height) \
  66. uv_buf_size = HFI_ALIGN(uv_stride * uv_buf_height, HFI_ALIGNMENT_4096)
  67. #define HFI_NV12_UBWC_IL_CALC_BUF_SIZE_V2(buf_size,\
  68. frame_width, frame_height, y_stride_multiple,\
  69. y_buffer_height_multiple, uv_stride_multiple, \
  70. uv_buffer_height_multiple, y_metadata_stride_multiple, \
  71. y_metadata_buffer_height_multiple, \
  72. uv_metadata_stride_multiple, uv_metadata_buffer_height_multiple) \
  73. do \
  74. { \
  75. HFI_U32 y_buf_size, uv_buf_size, y_meta_size, uv_meta_size; \
  76. HFI_U32 stride, _height; \
  77. HFI_U32 half_height = (frame_height + 1) >> 1; \
  78. HFI_NV12_IL_CALC_Y_STRIDE(stride, frame_width,\
  79. y_stride_multiple); \
  80. HFI_NV12_IL_CALC_Y_BUFHEIGHT(_height, half_height,\
  81. y_buffer_height_multiple); \
  82. HFI_NV12_UBWC_IL_CALC_Y_BUF_SIZE(y_buf_size, stride, _height);\
  83. HFI_NV12_IL_CALC_UV_STRIDE(stride, frame_width, \
  84. uv_stride_multiple); \
  85. HFI_NV12_IL_CALC_UV_BUFHEIGHT(_height, half_height, \
  86. uv_buffer_height_multiple); \
  87. HFI_NV12_UBWC_IL_CALC_UV_BUF_SIZE(uv_buf_size, stride, _height);\
  88. HFI_UBWC_CALC_METADATA_PLANE_STRIDE(stride, frame_width,\
  89. y_metadata_stride_multiple, \
  90. HFI_COLOR_FORMAT_YUV420_NV12_UBWC_Y_TILE_WIDTH);\
  91. HFI_UBWC_METADATA_PLANE_BUFHEIGHT(_height, half_height, \
  92. y_metadata_buffer_height_multiple,\
  93. HFI_COLOR_FORMAT_YUV420_NV12_UBWC_Y_TILE_HEIGHT);\
  94. HFI_UBWC_METADATA_PLANE_BUFFER_SIZE(y_meta_size, stride, \
  95. _height); \
  96. HFI_UBWC_UV_METADATA_PLANE_STRIDE(stride, frame_width,\
  97. uv_metadata_stride_multiple, \
  98. HFI_COLOR_FORMAT_YUV420_NV12_UBWC_UV_TILE_WIDTH); \
  99. HFI_UBWC_UV_METADATA_PLANE_BUFHEIGHT(_height, half_height,\
  100. uv_metadata_buffer_height_multiple,\
  101. HFI_COLOR_FORMAT_YUV420_NV12_UBWC_UV_TILE_HEIGHT);\
  102. HFI_UBWC_METADATA_PLANE_BUFFER_SIZE(uv_meta_size, stride, \
  103. _height); \
  104. buf_size = (y_buf_size + uv_buf_size + y_meta_size + \
  105. uv_meta_size) << 1;\
  106. } while (0)
  107. #define HFI_YUV420_TP10_CALC_Y_STRIDE(stride, frame_width, stride_multiple) \
  108. stride = HFI_ALIGN(frame_width, 192); \
  109. stride = HFI_ALIGN(stride * 4 / 3, stride_multiple)
  110. #define HFI_YUV420_TP10_CALC_Y_BUFHEIGHT(buf_height, frame_height, \
  111. min_buf_height_multiple) \
  112. buf_height = HFI_ALIGN(frame_height, min_buf_height_multiple)
  113. #define HFI_YUV420_TP10_CALC_UV_STRIDE(stride, frame_width, stride_multiple) \
  114. stride = HFI_ALIGN(frame_width, 192); \
  115. stride = HFI_ALIGN(stride * 4 / 3, stride_multiple)
  116. #define HFI_YUV420_TP10_CALC_UV_BUFHEIGHT(buf_height, frame_height, \
  117. min_buf_height_multiple) \
  118. buf_height = HFI_ALIGN(((frame_height + 1) >> 1), \
  119. min_buf_height_multiple)
  120. #define HFI_YUV420_TP10_CALC_BUF_SIZE(buf_size, y_buf_size, y_stride,\
  121. y_buf_height, uv_buf_size, uv_stride, uv_buf_height) \
  122. y_buf_size = (y_stride * y_buf_height); \
  123. uv_buf_size = (uv_stride * uv_buf_height); \
  124. buf_size = y_buf_size + uv_buf_size
  125. #define HFI_YUV420_TP10_UBWC_CALC_Y_BUF_SIZE(y_buf_size, y_stride, \
  126. y_buf_height) \
  127. y_buf_size = HFI_ALIGN(y_stride * y_buf_height, HFI_ALIGNMENT_4096)
  128. #define HFI_YUV420_TP10_UBWC_CALC_UV_BUF_SIZE(uv_buf_size, uv_stride, \
  129. uv_buf_height) \
  130. uv_buf_size = HFI_ALIGN(uv_stride * uv_buf_height, HFI_ALIGNMENT_4096)
  131. #define HFI_YUV420_TP10_UBWC_CALC_BUF_SIZE(buf_size, y_stride, y_buf_height, \
  132. uv_stride, uv_buf_height, y_md_stride, y_md_height, uv_md_stride, \
  133. uv_md_height)\
  134. do \
  135. { \
  136. HFI_U32 y_data_size, uv_data_size, y_md_size, uv_md_size; \
  137. HFI_YUV420_TP10_UBWC_CALC_Y_BUF_SIZE(y_data_size, y_stride,\
  138. y_buf_height); \
  139. HFI_YUV420_TP10_UBWC_CALC_UV_BUF_SIZE(uv_data_size, uv_stride, \
  140. uv_buf_height); \
  141. HFI_UBWC_METADATA_PLANE_BUFFER_SIZE(y_md_size, y_md_stride, \
  142. y_md_height); \
  143. HFI_UBWC_METADATA_PLANE_BUFFER_SIZE(uv_md_size, uv_md_stride, \
  144. uv_md_height); \
  145. buf_size = y_data_size + uv_data_size + y_md_size + \
  146. uv_md_size; \
  147. } while (0)
  148. #define HFI_YUV420_P010_CALC_Y_STRIDE(stride, frame_width, stride_multiple) \
  149. stride = HFI_ALIGN(frame_width * 2, stride_multiple)
  150. #define HFI_YUV420_P010_CALC_Y_BUFHEIGHT(buf_height, frame_height, \
  151. min_buf_height_multiple) \
  152. buf_height = HFI_ALIGN(frame_height, min_buf_height_multiple)
  153. #define HFI_YUV420_P010_CALC_UV_STRIDE(stride, frame_width, stride_multiple) \
  154. stride = HFI_ALIGN(frame_width * 2, stride_multiple)
  155. #define HFI_YUV420_P010_CALC_UV_BUFHEIGHT(buf_height, frame_height, \
  156. min_buf_height_multiple) \
  157. buf_height = HFI_ALIGN(((frame_height + 1) >> 1), \
  158. min_buf_height_multiple)
  159. #define HFI_YUV420_P010_CALC_BUF_SIZE(buf_size, y_data_size, y_stride, \
  160. y_buf_height, uv_data_size, uv_stride, uv_buf_height) \
  161. do \
  162. { \
  163. y_data_size = HFI_ALIGN(y_stride * y_buf_height, \
  164. HFI_ALIGNMENT_4096);\
  165. uv_data_size = HFI_ALIGN(uv_stride * uv_buf_height, \
  166. HFI_ALIGNMENT_4096); \
  167. buf_size = y_data_size + uv_data_size; \
  168. } while (0)
  169. #define HFI_RGB888_CALC_STRIDE(stride, frame_width, stride_multiple) \
  170. stride = ((frame_width * 3) + stride_multiple - 1) & \
  171. (0xffffffff - (stride_multiple - 1))
  172. #define HFI_RGB888_CALC_BUFHEIGHT(buf_height, frame_height, \
  173. min_buf_height_multiple) \
  174. buf_height = ((frame_height + min_buf_height_multiple - 1) & \
  175. (0xffffffff - (min_buf_height_multiple - 1)))
  176. #define HFI_RGB888_CALC_BUF_SIZE(buf_size, stride, buf_height) \
  177. buf_size = ((stride) * (buf_height))
  178. #define HFI_RGBA8888_CALC_STRIDE(stride, frame_width, stride_multiple) \
  179. stride = HFI_ALIGN((frame_width << 2), stride_multiple)
  180. #define HFI_RGBA8888_CALC_BUFHEIGHT(buf_height, frame_height, \
  181. min_buf_height_multiple) \
  182. buf_height = HFI_ALIGN(frame_height, min_buf_height_multiple)
  183. #define HFI_RGBA8888_CALC_BUF_SIZE(buf_size, stride, buf_height) \
  184. buf_size = (stride) * (buf_height)
  185. #define HFI_RGBA8888_UBWC_CALC_DATA_PLANE_BUF_SIZE(buf_size, stride, \
  186. buf_height) \
  187. buf_size = HFI_ALIGN((stride) * (buf_height), HFI_ALIGNMENT_4096)
  188. #define HFI_RGBA8888_UBWC_BUF_SIZE(buf_size, data_buf_size, \
  189. metadata_buffer_size, stride, buf_height, _metadata_tride, \
  190. _metadata_buf_height) \
  191. HFI_RGBA8888_UBWC_CALC_DATA_PLANE_BUF_SIZE(data_buf_size, \
  192. stride, buf_height); \
  193. HFI_UBWC_METADATA_PLANE_BUFFER_SIZE(metadata_buffer_size, \
  194. _metadata_tride, _metadata_buf_height); \
  195. buf_size = data_buf_size + metadata_buffer_size
  196. #define HFI_UBWC_CALC_METADATA_PLANE_STRIDE(metadata_stride, frame_width,\
  197. metadata_stride_multiple, tile_width_in_pels) \
  198. metadata_stride = HFI_ALIGN(((frame_width + (tile_width_in_pels - 1)) /\
  199. tile_width_in_pels), metadata_stride_multiple)
  200. #define HFI_UBWC_METADATA_PLANE_BUFHEIGHT(metadata_buf_height, frame_height, \
  201. metadata_height_multiple, tile_height_in_pels) \
  202. metadata_buf_height = HFI_ALIGN(((frame_height + \
  203. (tile_height_in_pels - 1)) / tile_height_in_pels), \
  204. metadata_height_multiple)
  205. #define HFI_UBWC_UV_METADATA_PLANE_STRIDE(metadata_stride, frame_width, \
  206. metadata_stride_multiple, tile_width_in_pels) \
  207. metadata_stride = HFI_ALIGN(((((frame_width + 1) >> 1) +\
  208. (tile_width_in_pels - 1)) / tile_width_in_pels), \
  209. metadata_stride_multiple)
  210. #define HFI_UBWC_UV_METADATA_PLANE_BUFHEIGHT(metadata_buf_height, frame_height,\
  211. metadata_height_multiple, tile_height_in_pels) \
  212. metadata_buf_height = HFI_ALIGN(((((frame_height + 1) >> 1) + \
  213. (tile_height_in_pels - 1)) / tile_height_in_pels), \
  214. metadata_height_multiple)
  215. #define HFI_UBWC_METADATA_PLANE_BUFFER_SIZE(buffer_size, _metadata_tride, \
  216. _metadata_buf_height) \
  217. buffer_size = HFI_ALIGN(_metadata_tride * _metadata_buf_height, \
  218. HFI_ALIGNMENT_4096)
  219. #define BUFFER_ALIGNMENT_512_BYTES 512
  220. #define BUFFER_ALIGNMENT_256_BYTES 256
  221. #define BUFFER_ALIGNMENT_128_BYTES 128
  222. #define BUFFER_ALIGNMENT_64_BYTES 64
  223. #define BUFFER_ALIGNMENT_32_BYTES 32
  224. #define BUFFER_ALIGNMENT_16_BYTES 16
  225. #define BUFFER_ALIGNMENT_8_BYTES 8
  226. #define BUFFER_ALIGNMENT_4_BYTES 4
  227. #define VENUS_DMA_ALIGNMENT BUFFER_ALIGNMENT_256_BYTES
  228. #define MAX_FE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE 64
  229. #define MAX_FE_NBR_CTRL_LCU32_LINE_BUFFER_SIZE 64
  230. #define MAX_FE_NBR_CTRL_LCU16_LINE_BUFFER_SIZE 64
  231. #define MAX_FE_NBR_DATA_LUMA_LINE_BUFFER_SIZE 640
  232. #define MAX_FE_NBR_DATA_CB_LINE_BUFFER_SIZE 320
  233. #define MAX_FE_NBR_DATA_CR_LINE_BUFFER_SIZE 320
  234. #define MAX_SE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE (128 / 8)
  235. #define MAX_SE_NBR_CTRL_LCU32_LINE_BUFFER_SIZE (128 / 8)
  236. #define MAX_SE_NBR_CTRL_LCU16_LINE_BUFFER_SIZE (128 / 8)
  237. #define MAX_PE_NBR_DATA_LCU64_LINE_BUFFER_SIZE (64 * 2 * 3)
  238. #define MAX_PE_NBR_DATA_LCU32_LINE_BUFFER_SIZE (32 * 2 * 3)
  239. #define MAX_PE_NBR_DATA_LCU16_LINE_BUFFER_SIZE (16 * 2 * 3)
  240. #define MAX_TILE_COLUMNS 32
  241. #define SIZE_VPSS_LB(Size, frame_width, frame_height, num_vpp_pipes) \
  242. do \
  243. { \
  244. HFI_U32 vpss_4tap_top_buffer_size, vpss_div2_top_buffer_size, \
  245. vpss_4tap_left_buffer_size, vpss_div2_left_buffer_size; \
  246. HFI_U32 opb_wr_top_line_luma_buffer_size, \
  247. opb_wr_top_line_chroma_buffer_size, \
  248. opb_lb_wr_llb_y_buffer_size,\
  249. opb_lb_wr_llb_uv_buffer_size; \
  250. HFI_U32 macrotiling_size; \
  251. vpss_4tap_top_buffer_size = vpss_div2_top_buffer_size = \
  252. vpss_4tap_left_buffer_size = vpss_div2_left_buffer_size = 0; \
  253. macrotiling_size = 32; \
  254. opb_wr_top_line_luma_buffer_size = HFI_ALIGN(frame_width, \
  255. macrotiling_size) / macrotiling_size * 256; \
  256. opb_wr_top_line_luma_buffer_size = \
  257. HFI_ALIGN(opb_wr_top_line_luma_buffer_size, \
  258. VENUS_DMA_ALIGNMENT) + (MAX_TILE_COLUMNS - 1) * 256; \
  259. opb_wr_top_line_luma_buffer_size = \
  260. MAX(opb_wr_top_line_luma_buffer_size, (32 * \
  261. HFI_ALIGN(frame_height, 8))); \
  262. opb_wr_top_line_chroma_buffer_size = \
  263. opb_wr_top_line_luma_buffer_size;\
  264. opb_lb_wr_llb_uv_buffer_size = opb_lb_wr_llb_y_buffer_size = \
  265. HFI_ALIGN((HFI_ALIGN(frame_height, 8) / (4 / 2)) * 64,\
  266. BUFFER_ALIGNMENT_32_BYTES); \
  267. Size = num_vpp_pipes * 2 * (vpss_4tap_top_buffer_size + \
  268. vpss_div2_top_buffer_size) + \
  269. 2 * (vpss_4tap_left_buffer_size + \
  270. vpss_div2_left_buffer_size) + \
  271. opb_wr_top_line_luma_buffer_size + \
  272. opb_wr_top_line_chroma_buffer_size + \
  273. opb_lb_wr_llb_uv_buffer_size + \
  274. opb_lb_wr_llb_y_buffer_size; \
  275. } while (0)
  276. #define VPP_CMD_MAX_SIZE (1 << 20)
  277. #define NUM_HW_PIC_BUF 32
  278. #define BIN_BUFFER_THRESHOLD (1280 * 736)
  279. #define H264D_MAX_SLICE 1800
  280. #define SIZE_H264D_BUFTAB_T (256)
  281. #define SIZE_H264D_HW_PIC_T (1 << 11)
  282. #define SIZE_H264D_BSE_CMD_PER_BUF (32 * 4)
  283. #define SIZE_H264D_VPP_CMD_PER_BUF (512)
  284. #define SIZE_H264D_LB_FE_TOP_DATA(frame_width, frame_height) \
  285. (MAX_FE_NBR_DATA_LUMA_LINE_BUFFER_SIZE * HFI_ALIGN(frame_width, 16) * 3)
  286. #define SIZE_H264D_LB_FE_TOP_CTRL(frame_width, frame_height) \
  287. (MAX_FE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE * ((frame_width + 15) >> 4))
  288. #define SIZE_H264D_LB_FE_LEFT_CTRL(frame_width, frame_height) \
  289. (MAX_FE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE * ((frame_height + 15) >> 4))
  290. #define SIZE_H264D_LB_SE_TOP_CTRL(frame_width, frame_height) \
  291. (MAX_SE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE * ((frame_width + 15) >> 4))
  292. #define SIZE_H264D_LB_SE_LEFT_CTRL(frame_width, frame_height) \
  293. (MAX_SE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE * ((frame_height + 15) >> 4))
  294. #define SIZE_H264D_LB_PE_TOP_DATA(frame_width, frame_height) \
  295. (MAX_PE_NBR_DATA_LCU64_LINE_BUFFER_SIZE * ((frame_width + 15) >> 4))
  296. #define SIZE_H264D_LB_VSP_TOP(frame_width, frame_height) \
  297. ((((frame_width + 15) >> 4) << 7))
  298. #define SIZE_H264D_LB_RECON_DMA_METADATA_WR(frame_width, frame_height) \
  299. (HFI_ALIGN(frame_height, 16) * 32)
  300. #define SIZE_H264D_QP(frame_width, frame_height) \
  301. (((frame_width + 63) >> 6) * ((frame_height + 63) >> 6) * 128)
  302. #define SIZE_HW_PIC(size_per_buf) \
  303. (NUM_HW_PIC_BUF * size_per_buf)
  304. #define SIZE_H264D_BSE_CMD_BUF(_size, frame_width, frame_height) \
  305. do \
  306. { \
  307. HFI_U32 _height = HFI_ALIGN(frame_height, \
  308. BUFFER_ALIGNMENT_32_BYTES); \
  309. _size = MIN((((_height + 15) >> 4) * 3 * 4), H264D_MAX_SLICE) *\
  310. SIZE_H264D_BSE_CMD_PER_BUF; \
  311. } while (0)
  312. #define SIZE_H264D_VPP_CMD_BUF(_size, frame_width, frame_height) \
  313. do \
  314. { \
  315. HFI_U32 _height = HFI_ALIGN(frame_height, \
  316. BUFFER_ALIGNMENT_32_BYTES); \
  317. _size = MIN((((_height + 15) >> 4) * 3 * 4), H264D_MAX_SLICE) * \
  318. SIZE_H264D_VPP_CMD_PER_BUF; \
  319. if (_size > VPP_CMD_MAX_SIZE) { _size = VPP_CMD_MAX_SIZE; } \
  320. } while (0)
  321. #define HFI_BUFFER_COMV_H264D(coMV_size, frame_width, \
  322. frame_height, _yuv_bufcount_min) \
  323. do \
  324. { \
  325. HFI_U32 frame_width_in_mbs = ((frame_width + 15) >> 4); \
  326. HFI_U32 frame_height_in_mbs = ((frame_height + 15) >> 4); \
  327. HFI_U32 col_mv_aligned_width = (frame_width_in_mbs << 7); \
  328. HFI_U32 col_zero_aligned_width = (frame_width_in_mbs << 2); \
  329. HFI_U32 col_zero_size = 0, size_colloc = 0; \
  330. col_mv_aligned_width = HFI_ALIGN(col_mv_aligned_width, \
  331. BUFFER_ALIGNMENT_16_BYTES); \
  332. col_zero_aligned_width = HFI_ALIGN(col_zero_aligned_width, \
  333. BUFFER_ALIGNMENT_16_BYTES); \
  334. col_zero_size = col_zero_aligned_width * \
  335. ((frame_height_in_mbs + 1) >> 1); \
  336. col_zero_size = HFI_ALIGN(col_zero_size, \
  337. BUFFER_ALIGNMENT_64_BYTES); \
  338. col_zero_size <<= 1; \
  339. col_zero_size = HFI_ALIGN(col_zero_size, \
  340. BUFFER_ALIGNMENT_512_BYTES); \
  341. size_colloc = col_mv_aligned_width * ((frame_height_in_mbs + \
  342. 1) >> 1); \
  343. size_colloc = HFI_ALIGN(size_colloc, \
  344. BUFFER_ALIGNMENT_64_BYTES); \
  345. size_colloc <<= 1; \
  346. size_colloc = HFI_ALIGN(size_colloc, \
  347. BUFFER_ALIGNMENT_512_BYTES); \
  348. size_colloc += (col_zero_size + SIZE_H264D_BUFTAB_T * 2); \
  349. coMV_size = size_colloc * (_yuv_bufcount_min); \
  350. coMV_size += BUFFER_ALIGNMENT_512_BYTES; \
  351. } while (0)
  352. #define HFI_BUFFER_NON_COMV_H264D(_size, frame_width, frame_height, \
  353. num_vpp_pipes) \
  354. do \
  355. { \
  356. HFI_U32 _size_bse, _size_vpp; \
  357. SIZE_H264D_BSE_CMD_BUF(_size_bse, frame_width, frame_height); \
  358. SIZE_H264D_VPP_CMD_BUF(_size_vpp, frame_width, frame_height); \
  359. _size = HFI_ALIGN(_size_bse, VENUS_DMA_ALIGNMENT) + \
  360. HFI_ALIGN(_size_vpp, VENUS_DMA_ALIGNMENT) + \
  361. HFI_ALIGN(SIZE_HW_PIC(SIZE_H264D_HW_PIC_T), \
  362. VENUS_DMA_ALIGNMENT); \
  363. _size = HFI_ALIGN(_size, VENUS_DMA_ALIGNMENT); \
  364. } while (0)
  365. #define HFI_BUFFER_LINE_H264D(_size, frame_width, frame_height, \
  366. is_opb, num_vpp_pipes) \
  367. do \
  368. { \
  369. HFI_U32 vpss_lb_size = 0; \
  370. _size = HFI_ALIGN(SIZE_H264D_LB_FE_TOP_DATA(frame_width, \
  371. frame_height), VENUS_DMA_ALIGNMENT) + \
  372. HFI_ALIGN(SIZE_H264D_LB_FE_TOP_CTRL(frame_width, \
  373. frame_height), VENUS_DMA_ALIGNMENT) + \
  374. HFI_ALIGN(SIZE_H264D_LB_FE_LEFT_CTRL(frame_width, \
  375. frame_height), VENUS_DMA_ALIGNMENT) * num_vpp_pipes + \
  376. HFI_ALIGN(SIZE_H264D_LB_SE_TOP_CTRL(frame_width, \
  377. frame_height), VENUS_DMA_ALIGNMENT) + \
  378. HFI_ALIGN(SIZE_H264D_LB_SE_LEFT_CTRL(frame_width, \
  379. frame_height), VENUS_DMA_ALIGNMENT) * \
  380. num_vpp_pipes + \
  381. HFI_ALIGN(SIZE_H264D_LB_PE_TOP_DATA(frame_width, \
  382. frame_height), VENUS_DMA_ALIGNMENT) + \
  383. HFI_ALIGN(SIZE_H264D_LB_VSP_TOP(frame_width, \
  384. frame_height), VENUS_DMA_ALIGNMENT) + \
  385. HFI_ALIGN(SIZE_H264D_LB_RECON_DMA_METADATA_WR\
  386. (frame_width, frame_height), \
  387. VENUS_DMA_ALIGNMENT) * 2 + HFI_ALIGN(SIZE_H264D_QP\
  388. (frame_width, frame_height), VENUS_DMA_ALIGNMENT); \
  389. _size = HFI_ALIGN(_size, VENUS_DMA_ALIGNMENT); \
  390. if (is_opb) \
  391. { \
  392. SIZE_VPSS_LB(vpss_lb_size, frame_width, frame_height, \
  393. num_vpp_pipes); \
  394. } \
  395. _size = HFI_ALIGN((_size + vpss_lb_size), \
  396. VENUS_DMA_ALIGNMENT); \
  397. } while (0)
  398. #define H264_CABAC_HDR_RATIO_HD_TOT 1
  399. #define H264_CABAC_RES_RATIO_HD_TOT 3
  400. #define SIZE_H264D_HW_BIN_BUFFER(_size, frame_width, frame_height, \
  401. delay, num_vpp_pipes) \
  402. do \
  403. { \
  404. HFI_U32 size_yuv, size_bin_hdr, size_bin_res; \
  405. size_yuv = ((frame_width * frame_height) <= \
  406. BIN_BUFFER_THRESHOLD) ?\
  407. ((BIN_BUFFER_THRESHOLD * 3) >> 1) : \
  408. ((frame_width * frame_height * 3) >> 1); \
  409. size_bin_hdr = size_yuv * H264_CABAC_HDR_RATIO_HD_TOT; \
  410. size_bin_res = size_yuv * H264_CABAC_RES_RATIO_HD_TOT; \
  411. size_bin_hdr = size_bin_hdr * (((((HFI_U32)(delay)) & 31) /\
  412. 10) + 2) / 2; \
  413. size_bin_res = size_bin_res * (((((HFI_U32)(delay)) & 31) /\
  414. 10) + 2) / 2; \
  415. size_bin_hdr = HFI_ALIGN(size_bin_hdr / num_vpp_pipes,\
  416. VENUS_DMA_ALIGNMENT) * num_vpp_pipes; \
  417. size_bin_res = HFI_ALIGN(size_bin_res / num_vpp_pipes, \
  418. VENUS_DMA_ALIGNMENT) * num_vpp_pipes; \
  419. _size = size_bin_hdr + size_bin_res; \
  420. } while (0)
  421. #define HFI_BUFFER_BIN_H264D(_size, frame_width, frame_height, is_interlaced, \
  422. delay, num_vpp_pipes) \
  423. do \
  424. { \
  425. HFI_U32 n_aligned_w = HFI_ALIGN(frame_width, \
  426. BUFFER_ALIGNMENT_16_BYTES);\
  427. HFI_U32 n_aligned_h = HFI_ALIGN(frame_height, \
  428. BUFFER_ALIGNMENT_16_BYTES); \
  429. if (!is_interlaced) \
  430. { \
  431. SIZE_H264D_HW_BIN_BUFFER(_size, n_aligned_w, \
  432. n_aligned_h, delay, num_vpp_pipes); \
  433. } \
  434. else \
  435. { \
  436. _size = 0; \
  437. } \
  438. } while (0)
  439. #define NUM_SLIST_BUF_H264 (256 + 32)
  440. #define SIZE_SLIST_BUF_H264 (512)
  441. #define SIZE_SEI_USERDATA (4096)
  442. #define HFI_BUFFER_PERSIST_H264D(_size) \
  443. _size = HFI_ALIGN((SIZE_SLIST_BUF_H264 * NUM_SLIST_BUF_H264 + \
  444. NUM_HW_PIC_BUF * SIZE_SEI_USERDATA), VENUS_DMA_ALIGNMENT)
  445. #define LCU_MAX_SIZE_PELS 64
  446. #define LCU_MIN_SIZE_PELS 16
  447. #define H265D_MAX_SLICE 1200
  448. #define SIZE_H265D_HW_PIC_T SIZE_H264D_HW_PIC_T
  449. #define SIZE_H265D_BSE_CMD_PER_BUF (16 * sizeof(HFI_U32))
  450. #define SIZE_H265D_VPP_CMD_PER_BUF (256)
  451. #define SIZE_H265D_LB_FE_TOP_DATA(frame_width, frame_height) \
  452. (MAX_FE_NBR_DATA_LUMA_LINE_BUFFER_SIZE * \
  453. (HFI_ALIGN(frame_width, 64) + 8) * 2)
  454. #define SIZE_H265D_LB_FE_TOP_CTRL(frame_width, frame_height) \
  455. (MAX_FE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE * \
  456. (HFI_ALIGN(frame_width, LCU_MAX_SIZE_PELS) / LCU_MIN_SIZE_PELS))
  457. #define SIZE_H265D_LB_FE_LEFT_CTRL(frame_width, frame_height) \
  458. (MAX_FE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE * \
  459. (HFI_ALIGN(frame_height, LCU_MAX_SIZE_PELS) / LCU_MIN_SIZE_PELS))
  460. #define SIZE_H265D_LB_SE_TOP_CTRL(frame_width, frame_height) \
  461. ((LCU_MAX_SIZE_PELS / 8 * (128 / 8)) * ((frame_width + 15) >> 4))
  462. #define SIZE_H265D_LB_SE_LEFT_CTRL(frame_width, frame_height) \
  463. (MAX(((frame_height + 16 - 1) / 8) * \
  464. MAX_SE_NBR_CTRL_LCU16_LINE_BUFFER_SIZE, \
  465. MAX(((frame_height + 32 - 1) / 8) * \
  466. MAX_SE_NBR_CTRL_LCU32_LINE_BUFFER_SIZE, \
  467. ((frame_height + 64 - 1) / 8) * \
  468. MAX_SE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE)))
  469. #define SIZE_H265D_LB_PE_TOP_DATA(frame_width, frame_height) \
  470. (MAX_PE_NBR_DATA_LCU64_LINE_BUFFER_SIZE * (HFI_ALIGN(frame_width, \
  471. LCU_MIN_SIZE_PELS) / LCU_MIN_SIZE_PELS))
  472. #define SIZE_H265D_LB_VSP_TOP(frame_width, frame_height) \
  473. (((frame_width + 63) >> 6) * 128)
  474. #define SIZE_H265D_LB_VSP_LEFT(frame_width, frame_height) \
  475. (((frame_height + 63) >> 6) * 128)
  476. #define SIZE_H265D_LB_RECON_DMA_METADATA_WR(frame_width, frame_height) \
  477. SIZE_H264D_LB_RECON_DMA_METADATA_WR(frame_width, frame_height)
  478. #define SIZE_H265D_QP(frame_width, frame_height) \
  479. SIZE_H264D_QP(frame_width, frame_height)
  480. #define SIZE_H265D_BSE_CMD_BUF(_size, frame_width, frame_height)\
  481. do \
  482. { \
  483. _size = HFI_ALIGN(((HFI_ALIGN(frame_width, \
  484. LCU_MAX_SIZE_PELS) / LCU_MIN_SIZE_PELS) * \
  485. (HFI_ALIGN(frame_height, LCU_MAX_SIZE_PELS) /\
  486. LCU_MIN_SIZE_PELS)) * NUM_HW_PIC_BUF, VENUS_DMA_ALIGNMENT); \
  487. _size = MIN(_size, H265D_MAX_SLICE + 1); \
  488. _size = 2 * _size * SIZE_H265D_BSE_CMD_PER_BUF; \
  489. } while (0)
  490. #define SIZE_H265D_VPP_CMD_BUF(_size, frame_width, frame_height) \
  491. do \
  492. { \
  493. _size = HFI_ALIGN(((HFI_ALIGN(frame_width, LCU_MAX_SIZE_PELS) /\
  494. LCU_MIN_SIZE_PELS) * (HFI_ALIGN(frame_height, \
  495. LCU_MAX_SIZE_PELS) / LCU_MIN_SIZE_PELS)) * \
  496. NUM_HW_PIC_BUF, VENUS_DMA_ALIGNMENT); \
  497. _size = MIN(_size, H265D_MAX_SLICE + 1); \
  498. _size = HFI_ALIGN(_size, 4); \
  499. _size = 2 * _size * SIZE_H265D_VPP_CMD_PER_BUF; \
  500. if (_size > VPP_CMD_MAX_SIZE) \
  501. { \
  502. _size = VPP_CMD_MAX_SIZE; \
  503. } \
  504. } while (0)
  505. #define HFI_BUFFER_COMV_H265D(_size, frame_width, frame_height, \
  506. _yuv_bufcount_min) \
  507. do \
  508. { \
  509. _size = HFI_ALIGN(((((frame_width + 15) >> 4) * \
  510. ((frame_height + 15) >> 4)) << 8), \
  511. BUFFER_ALIGNMENT_512_BYTES); \
  512. _size *= _yuv_bufcount_min; \
  513. _size += BUFFER_ALIGNMENT_512_BYTES; \
  514. } while (0)
  515. #define HDR10_HIST_EXTRADATA_SIZE (4 * 1024)
  516. #define HFI_BUFFER_NON_COMV_H265D(_size, frame_width, frame_height, \
  517. num_vpp_pipes) \
  518. do \
  519. { \
  520. HFI_U32 _size_bse, _size_vpp; \
  521. SIZE_H265D_BSE_CMD_BUF(_size_bse, frame_width, \
  522. frame_height); \
  523. SIZE_H265D_VPP_CMD_BUF(_size_vpp, frame_width, \
  524. frame_height); \
  525. _size = HFI_ALIGN(_size_bse, VENUS_DMA_ALIGNMENT) + \
  526. HFI_ALIGN(_size_vpp, VENUS_DMA_ALIGNMENT) + \
  527. HFI_ALIGN(NUM_HW_PIC_BUF * 20 * 22 * 4, \
  528. VENUS_DMA_ALIGNMENT) + \
  529. HFI_ALIGN(2 * sizeof(HFI_U16) * \
  530. (HFI_ALIGN(frame_width, LCU_MAX_SIZE_PELS) / \
  531. LCU_MIN_SIZE_PELS) * (HFI_ALIGN(frame_height, \
  532. LCU_MAX_SIZE_PELS) / LCU_MIN_SIZE_PELS), \
  533. VENUS_DMA_ALIGNMENT) + \
  534. HFI_ALIGN(SIZE_HW_PIC(SIZE_H265D_HW_PIC_T), \
  535. VENUS_DMA_ALIGNMENT) + \
  536. HDR10_HIST_EXTRADATA_SIZE; \
  537. _size = HFI_ALIGN(_size, VENUS_DMA_ALIGNMENT); \
  538. } while (0)
  /*
   * HFI_BUFFER_LINE_H265D - store the H.265 decoder line buffer size in _size.
   *
   * Sums the SIZE_H265D_LB_* and SIZE_H265D_QP() components, each aligned to
   * VENUS_DMA_ALIGNMENT. The FE_LEFT_CTRL, SE_LEFT_CTRL and VSP_LEFT
   * components are multiplied by num_vpp_pipes; the RECON_DMA_METADATA_WR
   * component is multiplied by 4. When is_opb is non-zero the value produced
   * by SIZE_VPSS_LB() is added. The total is aligned to VENUS_DMA_ALIGNMENT.
   *
   * num_vpp_pipes is parenthesised where it is used as a multiplier, so a
   * compound expression may be passed. frame_width and frame_height are
   * forwarded unchanged to the helper macros.
   */
  #define HFI_BUFFER_LINE_H265D(_size, frame_width, frame_height, \
                                is_opb, num_vpp_pipes) \
      do \
      { \
          HFI_U32 vpss_lb_size = 0; \
          _size = HFI_ALIGN(SIZE_H265D_LB_FE_TOP_DATA(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_H265D_LB_FE_TOP_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_H265D_LB_FE_LEFT_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) * \
                      (num_vpp_pipes) + \
                  HFI_ALIGN(SIZE_H265D_LB_SE_LEFT_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) * \
                      (num_vpp_pipes) + \
                  HFI_ALIGN(SIZE_H265D_LB_SE_TOP_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_H265D_LB_PE_TOP_DATA(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_H265D_LB_VSP_TOP(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_H265D_LB_VSP_LEFT(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) * \
                      (num_vpp_pipes) + \
                  HFI_ALIGN(SIZE_H265D_LB_RECON_DMA_METADATA_WR(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) * 4 + \
                  HFI_ALIGN(SIZE_H265D_QP(frame_width, frame_height), \
                      VENUS_DMA_ALIGNMENT); \
          if (is_opb) \
          { \
              SIZE_VPSS_LB(vpss_lb_size, frame_width, frame_height, \
                           num_vpp_pipes); \
          } \
          _size = HFI_ALIGN((_size + vpss_lb_size), VENUS_DMA_ALIGNMENT); \
      } while (0)
  /* Multipliers applied to the YUV size in SIZE_H265D_HW_BIN_BUFFER(). */
  #define H265_CABAC_HDR_RATIO_HD_TOT 2 /* header bin share */
  #define H265_CABAC_RES_RATIO_HD_TOT 2 /* residual bin share */
  /*
   * SIZE_H265D_HW_BIN_BUFFER - store the H.265 decoder bin buffer size in
   * _size.
   *
   * size_yuv is 1.5 bytes per pixel of frame_width * frame_height, but never
   * less than 1.5 * BIN_BUFFER_THRESHOLD. The header and residual bins start
   * at size_yuv times their H265_CABAC_*_RATIO_HD_TOT factor and are then
   * scaled by ((delay & 31) / 10 + 2) / 2 in integer arithmetic. Each bin is
   * divided by num_vpp_pipes, aligned to VENUS_DMA_ALIGNMENT and multiplied
   * back by num_vpp_pipes. _size is the sum of both bins.
   *
   * num_vpp_pipes is used as a divisor and must be non-zero. All value
   * arguments are parenthesised on use.
   */
  #define SIZE_H265D_HW_BIN_BUFFER(_size, frame_width, frame_height, \
                                   delay, num_vpp_pipes) \
      do \
      { \
          HFI_U32 size_yuv, size_bin_hdr, size_bin_res; \
          size_yuv = (((frame_width) * (frame_height)) <= \
                      BIN_BUFFER_THRESHOLD) ? \
                         ((BIN_BUFFER_THRESHOLD * 3) >> 1) : \
                         (((frame_width) * (frame_height) * 3) >> 1); \
          size_bin_hdr = size_yuv * H265_CABAC_HDR_RATIO_HD_TOT; \
          size_bin_res = size_yuv * H265_CABAC_RES_RATIO_HD_TOT; \
          size_bin_hdr = size_bin_hdr * \
                         (((((HFI_U32)(delay)) & 31) / 10) + 2) / 2; \
          size_bin_res = size_bin_res * \
                         (((((HFI_U32)(delay)) & 31) / 10) + 2) / 2; \
          size_bin_hdr = HFI_ALIGN(size_bin_hdr / (num_vpp_pipes), \
                                   VENUS_DMA_ALIGNMENT) * \
                         (num_vpp_pipes); \
          size_bin_res = HFI_ALIGN(size_bin_res / (num_vpp_pipes), \
                                   VENUS_DMA_ALIGNMENT) * \
                         (num_vpp_pipes); \
          _size = size_bin_hdr + size_bin_res; \
      } while (0)
  /*
   * HFI_BUFFER_BIN_H265D - store the H.265 decoder bin buffer size in _size.
   *
   * For non-interlaced content both frame dimensions are aligned to
   * BUFFER_ALIGNMENT_16_BYTES and handed to SIZE_H265D_HW_BIN_BUFFER().
   * For interlaced content _size is set to 0.
   *
   * is_interlaced is parenthesised before negation, so an expression such as
   * `flags & 1` is tested as a whole.
   */
  #define HFI_BUFFER_BIN_H265D(_size, frame_width, frame_height, \
                               is_interlaced, delay, num_vpp_pipes) \
      do \
      { \
          HFI_U32 n_aligned_w = HFI_ALIGN(frame_width, \
                                          BUFFER_ALIGNMENT_16_BYTES); \
          HFI_U32 n_aligned_h = HFI_ALIGN(frame_height, \
                                          BUFFER_ALIGNMENT_16_BYTES); \
          if (!(is_interlaced)) \
          { \
              SIZE_H265D_HW_BIN_BUFFER(_size, n_aligned_w, n_aligned_h, \
                                       delay, num_vpp_pipes); \
          } \
          else \
          { \
              _size = 0; \
          } \
      } while (0)
  /* Constants summed by HFI_BUFFER_PERSIST_H265D(). */
  #define SIZE_SLIST_BUF_H265 (1 << 10) /* bytes per slist buffer */
  #define NUM_SLIST_BUF_H265 (80 + 20)  /* number of slist buffers */
  #define H265_NUM_TILE_COL 32
  #define H265_NUM_TILE_ROW 128
  /* One entry per tile (rows * columns) plus one extra entry. */
  #define H265_NUM_TILE (H265_NUM_TILE_ROW * H265_NUM_TILE_COL + 1)
  /*
   * HFI_BUFFER_PERSIST_H265D - store the H.265 decoder persist buffer size in
   * _size.
   *
   * Adds NUM_SLIST_BUF_H265 slist buffers of SIZE_SLIST_BUF_H265 bytes, one
   * HFI_U32 per H265_NUM_TILE entry and NUM_HW_PIC_BUF blocks of
   * SIZE_SEI_USERDATA bytes, then aligns the sum to VENUS_DMA_ALIGNMENT.
   * Expands to a bare assignment expression; the caller supplies the ';'.
   */
  #define HFI_BUFFER_PERSIST_H265D(_size) \
      _size = HFI_ALIGN((SIZE_SLIST_BUF_H265 * NUM_SLIST_BUF_H265 + \
                         H265_NUM_TILE * sizeof(HFI_U32) + \
                         NUM_HW_PIC_BUF * SIZE_SEI_USERDATA), \
                        VENUS_DMA_ALIGNMENT)
  /*
   * SIZE_VPXD_LB_FE_LEFT_CTRL - largest of three candidate sizes: the frame
   * height counted in rows of 16, 32 and 64 pixels (rounded up), each times
   * the matching MAX_FE_NBR_CTRL_LCU{16,32,64}_LINE_BUFFER_SIZE.
   *
   * frame_width is not used. frame_height is parenthesised on use; note that
   * MAX() may evaluate it more than once.
   */
  #define SIZE_VPXD_LB_FE_LEFT_CTRL(frame_width, frame_height) \
      MAX((((frame_height) + 15) >> 4) * \
              MAX_FE_NBR_CTRL_LCU16_LINE_BUFFER_SIZE, \
          MAX((((frame_height) + 31) >> 5) * \
                  MAX_FE_NBR_CTRL_LCU32_LINE_BUFFER_SIZE, \
              (((frame_height) + 63) >> 6) * \
                  MAX_FE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE))
  /*
   * SIZE_VPXD_LB_FE_TOP_CTRL - (frame_width aligned to 64, plus 8) * 10 * 2.
   * frame_height is not used.
   */
  #define SIZE_VPXD_LB_FE_TOP_CTRL(frame_width, frame_height) \
      (((HFI_ALIGN(frame_width, 64) + 8) * 10 * 2))
  /*
   * SIZE_VPXD_LB_SE_TOP_CTRL - frame width in 16-pixel columns (rounded up)
   * times MAX_FE_NBR_CTRL_LCU16_LINE_BUFFER_SIZE.
   *
   * frame_height is not used. frame_width is parenthesised on use.
   */
  #define SIZE_VPXD_LB_SE_TOP_CTRL(frame_width, frame_height) \
      ((((frame_width) + 15) >> 4) * MAX_FE_NBR_CTRL_LCU16_LINE_BUFFER_SIZE)
  /*
   * SIZE_VPXD_LB_SE_LEFT_CTRL - largest of three candidate sizes: the frame
   * height counted in rows of 16, 32 and 64 pixels (rounded up), each times
   * the matching MAX_SE_NBR_CTRL_LCU{16,32,64}_LINE_BUFFER_SIZE.
   *
   * frame_width is not used. frame_height is parenthesised on use; note that
   * MAX() may evaluate it more than once.
   */
  #define SIZE_VPXD_LB_SE_LEFT_CTRL(frame_width, frame_height) \
      MAX((((frame_height) + 15) >> 4) * \
              MAX_SE_NBR_CTRL_LCU16_LINE_BUFFER_SIZE, \
          MAX((((frame_height) + 31) >> 5) * \
                  MAX_SE_NBR_CTRL_LCU32_LINE_BUFFER_SIZE, \
              (((frame_height) + 63) >> 6) * \
                  MAX_SE_NBR_CTRL_LCU64_LINE_BUFFER_SIZE))
  /*
   * SIZE_VPXD_LB_RECON_DMA_METADATA_WR - frame_height aligned to 8, divided
   * by (4 / 2), times 64, aligned to BUFFER_ALIGNMENT_32_BYTES.
   * frame_width is not used.
   */
  #define SIZE_VPXD_LB_RECON_DMA_METADATA_WR(frame_width, frame_height) \
      HFI_ALIGN((HFI_ALIGN(frame_height, 8) / (4 / 2)) * 64, \
                BUFFER_ALIGNMENT_32_BYTES)
  /*
   * Per-component line buffer sizes for the MP2D and VP9D line buffer
   * macros. All six depend only on frame_width; frame_height is not used.
   * The MP2D variants align the width to 16, the VP9D variants align it to 8
   * and then to 64.
   */

  /* (aligned width + 8) * 10 * 2 */
  #define SIZE_MP2D_LB_FE_TOP_DATA(frame_width, frame_height) \
      ((HFI_ALIGN(frame_width, 16) + 8) * 10 * 2)
  #define SIZE_VP9D_LB_FE_TOP_DATA(frame_width, frame_height) \
      ((HFI_ALIGN(HFI_ALIGN(frame_width, 8), 64) + 8) * 10 * 2)

  /* 64 bytes per 16-pixel column (MP2D), 176 bytes per 64-pixel column (VP9D) */
  #define SIZE_MP2D_LB_PE_TOP_DATA(frame_width, frame_height) \
      ((HFI_ALIGN(frame_width, 16) >> 4) * 64)
  #define SIZE_VP9D_LB_PE_TOP_DATA(frame_width, frame_height) \
      ((HFI_ALIGN(HFI_ALIGN(frame_width, 8), 64) >> 6) * 176)

  /* per-column term plus a fixed 256 bytes */
  #define SIZE_MP2D_LB_VSP_TOP(frame_width, frame_height) \
      (((HFI_ALIGN(frame_width, 16) >> 4) * 64 / 2) + 256)
  #define SIZE_VP9D_LB_VSP_TOP(frame_width, frame_height) \
      ((((HFI_ALIGN(HFI_ALIGN(frame_width, 8), 64) >> 6) * 64 * 8) + 256))
  /*
   * Fixed VP9 decoder COMV size: an 8192x4320 frame counted in 64x64 blocks
   * (each dimension rounded up), times 8 * 8 * 2 * 8.
   */
  #define HFI_IRIS2_VP9D_COMV_SIZE \
      ((((8192 + 63) >> 6) * ((4320 + 63) >> 6) * 8 * 8 * 2 * 8))
  /* The VP9 decoder QP size is the same expression as SIZE_H264D_QP(). */
  #define SIZE_VP9D_QP(frame_width, frame_height) \
      SIZE_H264D_QP(frame_width, frame_height)
  /*
   * HFI_IRIS2_VP9D_LB_SIZE - store the VP9 decoder line buffer size (without
   * the VPSS part) in _size.
   *
   * Sums the SIZE_VPXD_LB_*, SIZE_VP9D_LB_* and SIZE_VP9D_QP() components,
   * each aligned to VENUS_DMA_ALIGNMENT. The FE_LEFT_CTRL and SE_LEFT_CTRL
   * components are multiplied by num_vpp_pipes, and the
   * RECON_DMA_METADATA_WR component is counted twice.
   *
   * num_vpp_pipes is parenthesised where it is used as a multiplier.
   */
  #define HFI_IRIS2_VP9D_LB_SIZE(_size, frame_width, frame_height, \
                                 num_vpp_pipes) \
      do \
      { \
          _size = HFI_ALIGN(SIZE_VPXD_LB_FE_LEFT_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) * \
                      (num_vpp_pipes) + \
                  HFI_ALIGN(SIZE_VPXD_LB_SE_LEFT_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) * \
                      (num_vpp_pipes) + \
                  HFI_ALIGN(SIZE_VP9D_LB_VSP_TOP(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_VPXD_LB_FE_TOP_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  2 * HFI_ALIGN(SIZE_VPXD_LB_RECON_DMA_METADATA_WR( \
                      frame_width, frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_VPXD_LB_SE_TOP_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_VP9D_LB_PE_TOP_DATA(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_VP9D_LB_FE_TOP_DATA(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_VP9D_QP(frame_width, frame_height), \
                      VENUS_DMA_ALIGNMENT); \
      } while (0)
  /*
   * HFI_BUFFER_LINE_VP9D - store the VP9 decoder line buffer size in _size.
   *
   * The result is the value produced by HFI_IRIS2_VP9D_LB_SIZE() plus, when
   * is_opb is non-zero, the value produced by SIZE_VPSS_LB().
   * _yuv_bufcount_min is accepted but not used.
   */
  #define HFI_BUFFER_LINE_VP9D(_size, frame_width, frame_height, \
                               _yuv_bufcount_min, is_opb, num_vpp_pipes) \
      do \
      { \
          HFI_U32 lb_bytes = 0; \
          HFI_U32 vpss_bytes = 0; \
          HFI_IRIS2_VP9D_LB_SIZE(lb_bytes, frame_width, frame_height, \
                                 num_vpp_pipes); \
          if (is_opb) \
          { \
              SIZE_VPSS_LB(vpss_bytes, frame_width, frame_height, \
                           num_vpp_pipes); \
          } \
          _size = lb_bytes + vpss_bytes; \
      } while (0)
  /* Factors used by HFI_BUFFER_BIN_VP9D(). */
  #define VPX_DECODER_FRAME_CONCURENCY_LVL (2)
  /*
   * The two ratios are intentionally left without parentheses: they are
   * pasted after a left operand, so `x * RATIO` becomes `x * 1 / 2` (or
   * `x * 3 / 2`) and the multiplication happens before the integer division.
   * Wrapping them in parentheses would reduce them to 0 and 1.
   */
  #define VPX_DECODER_FRAME_BIN_HDR_BUDGET_RATIO 1 / 2
  #define VPX_DECODER_FRAME_BIN_RES_BUDGET_RATIO 3 / 2
  /*
   * HFI_BUFFER_BIN_VP9D - store the VP9 decoder bin buffer size in _size.
   *
   * _size_yuv is 1.5 bytes per pixel of the frame with both dimensions
   * aligned to BUFFER_ALIGNMENT_16_BYTES. For non-interlaced content the
   * larger of _size_yuv and 1.5 * BIN_BUFFER_THRESHOLD is scaled by the
   * header ratio and by the residual ratio (each times
   * VPX_DECODER_FRAME_CONCURENCY_LVL); each share is divided by
   * num_vpp_pipes and aligned to VENUS_DMA_ALIGNMENT, and the sum is
   * multiplied by num_vpp_pipes. For interlaced content _size is 0.
   *
   * The VPX_DECODER_FRAME_BIN_*_BUDGET_RATIO macros expand to `1 / 2` and
   * `3 / 2` textually, so the operand order below must not change.
   * num_vpp_pipes is used as a divisor and must be non-zero. is_interlaced
   * and num_vpp_pipes are parenthesised on use.
   */
  #define HFI_BUFFER_BIN_VP9D(_size, frame_width, frame_height, \
                              is_interlaced, num_vpp_pipes) \
      do \
      { \
          HFI_U32 _size_yuv = \
              HFI_ALIGN(frame_width, BUFFER_ALIGNMENT_16_BYTES) * \
              HFI_ALIGN(frame_height, BUFFER_ALIGNMENT_16_BYTES) * 3 / 2; \
          if (!(is_interlaced)) \
          { \
              _size = HFI_ALIGN(((MAX(_size_yuv, \
                              ((BIN_BUFFER_THRESHOLD * 3) >> 1)) * \
                          VPX_DECODER_FRAME_BIN_HDR_BUDGET_RATIO * \
                          VPX_DECODER_FRAME_CONCURENCY_LVL) / \
                          (num_vpp_pipes)), \
                      VENUS_DMA_ALIGNMENT) + \
                      HFI_ALIGN(((MAX(_size_yuv, \
                              ((BIN_BUFFER_THRESHOLD * 3) >> 1)) * \
                          VPX_DECODER_FRAME_BIN_RES_BUDGET_RATIO * \
                          VPX_DECODER_FRAME_CONCURENCY_LVL) / \
                          (num_vpp_pipes)), \
                      VENUS_DMA_ALIGNMENT); \
              _size = _size * (num_vpp_pipes); \
          } \
          else \
          { \
              _size = 0; \
          } \
      } while (0)
  /* Constants summed by HFI_BUFFER_PERSIST_VP9D(). */
  #define VP9_NUM_FRAME_INFO_BUF 32
  #define VP9_NUM_PROBABILITY_TABLE_BUF (VP9_NUM_FRAME_INFO_BUF + 4)
  #define VP9_PROB_TABLE_SIZE (3840)
  #define VP9_UDC_HEADER_BUF_SIZE (3 * 128)
  #define MAX_SUPERFRAME_HEADER_LEN (34)
  /* 32 * 4 * 4 bytes, aligned to BUFFER_ALIGNMENT_32_BYTES. */
  #define CCE_TILE_OFFSET_SIZE \
      HFI_ALIGN(32 * 4 * 4, BUFFER_ALIGNMENT_32_BYTES)
  /*
   * HFI_BUFFER_PERSIST_VP9D - store the VP9 decoder persist buffer size in
   * _size.
   *
   * Adds, each aligned to VENUS_DMA_ALIGNMENT: the probability tables
   * (VP9_NUM_PROBABILITY_TABLE_BUF * VP9_PROB_TABLE_SIZE),
   * HFI_IRIS2_VP9D_COMV_SIZE, MAX_SUPERFRAME_HEADER_LEN,
   * VP9_UDC_HEADER_BUF_SIZE and VP9_NUM_FRAME_INFO_BUF *
   * CCE_TILE_OFFSET_SIZE; then adds HDR10_HIST_EXTRADATA_SIZE unaligned.
   * Expands to a bare assignment expression; the caller supplies the ';'.
   */
  #define HFI_BUFFER_PERSIST_VP9D(_size) \
      _size = HFI_ALIGN(VP9_NUM_PROBABILITY_TABLE_BUF * VP9_PROB_TABLE_SIZE, \
                        VENUS_DMA_ALIGNMENT) + \
              HFI_ALIGN(HFI_IRIS2_VP9D_COMV_SIZE, VENUS_DMA_ALIGNMENT) + \
              HFI_ALIGN(MAX_SUPERFRAME_HEADER_LEN, VENUS_DMA_ALIGNMENT) + \
              HFI_ALIGN(VP9_UDC_HEADER_BUF_SIZE, VENUS_DMA_ALIGNMENT) + \
              HFI_ALIGN(VP9_NUM_FRAME_INFO_BUF * CCE_TILE_OFFSET_SIZE, \
                        VENUS_DMA_ALIGNMENT) + \
              HDR10_HIST_EXTRADATA_SIZE
  /*
   * HFI_BUFFER_LINE_MP2D - store the MPEG-2 decoder line buffer size in
   * _size.
   *
   * Sums the SIZE_VPXD_LB_* and SIZE_MP2D_LB_* components, each aligned to
   * VENUS_DMA_ALIGNMENT. The FE_LEFT_CTRL and SE_LEFT_CTRL components are
   * multiplied by num_vpp_pipes and the RECON_DMA_METADATA_WR component is
   * counted twice. When is_opb is non-zero the value produced by
   * SIZE_VPSS_LB() is added.
   *
   * _yuv_bufcount_min is accepted but not used. num_vpp_pipes is
   * parenthesised where it is used as a multiplier.
   */
  #define HFI_BUFFER_LINE_MP2D(_size, frame_width, frame_height, \
                               _yuv_bufcount_min, is_opb, num_vpp_pipes) \
      do \
      { \
          HFI_U32 vpss_lb_size = 0; \
          _size = HFI_ALIGN(SIZE_VPXD_LB_FE_LEFT_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) * \
                      (num_vpp_pipes) + \
                  HFI_ALIGN(SIZE_VPXD_LB_SE_LEFT_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) * \
                      (num_vpp_pipes) + \
                  HFI_ALIGN(SIZE_MP2D_LB_VSP_TOP(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_VPXD_LB_FE_TOP_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  2 * HFI_ALIGN(SIZE_VPXD_LB_RECON_DMA_METADATA_WR( \
                      frame_width, frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_VPXD_LB_SE_TOP_CTRL(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_MP2D_LB_PE_TOP_DATA(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT) + \
                  HFI_ALIGN(SIZE_MP2D_LB_FE_TOP_DATA(frame_width, \
                      frame_height), VENUS_DMA_ALIGNMENT); \
          if (is_opb) \
          { \
              SIZE_VPSS_LB(vpss_lb_size, frame_width, frame_height, \
                           num_vpp_pipes); \
          } \
          _size += vpss_lb_size; \
      } while (0)
  /*
   * HFI_BUFFER_BIN_MP2D - the MPEG-2 decoder bin buffer size is always 0.
   *
   * Stores 0 in _size, like the other HFI_BUFFER_BIN_* macros store their
   * result, and also evaluates to 0 so that existing uses of the macro as a
   * plain value keep working. _size must be a modifiable lvalue. The
   * remaining arguments are not used.
   */
  #define HFI_BUFFER_BIN_MP2D(_size, frame_width, frame_height, is_interlaced) \
      ((_size) = 0)
  /* Terms summed by HFI_BUFFER_PERSIST_MP2D(). */
  #define QMATRIX_SIZE (sizeof(HFI_U32) * 128 + 256) /* 128 HFI_U32 words + 256 bytes */
  #define MP2D_QPDUMP_SIZE 115200
  /*
   * HFI_BUFFER_PERSIST_MP2D - store the MPEG-2 decoder persist buffer size
   * (QMATRIX_SIZE + MP2D_QPDUMP_SIZE) in _size.
   *
   * Expands to a bare assignment expression with no trailing ';', matching
   * HFI_BUFFER_PERSIST_H265D() and HFI_BUFFER_PERSIST_VP9D(). The caller
   * supplies the ';', so the macro can be used as the body of an unbraced
   * if/else.
   */
  #define HFI_BUFFER_PERSIST_MP2D(_size) \
      _size = QMATRIX_SIZE + MP2D_QPDUMP_SIZE
  /*
   * HFI_BUFFER_BITSTREAM_ENC - store the encoder output bitstream buffer size
   * in size.
   *
   * Both dimensions are aligned to 32 and the starting value is
   * width * height * 3. It is then scaled:
   *   - aligned area above 4096x2176:      divided by 8,
   *   - otherwise, value above 1280*720:   divided by 4,
   *   - otherwise:                         doubled.
   * The result is doubled again for HFI_RC_CQ or HFI_RC_OFF, increased by a
   * quarter for 10-bit content, and aligned to HFI_ALIGNMENT_4096.
   *
   * NOTE(review): the second threshold compares bitstream_size (already
   * 3 x area) with 1280*720, while the first compares the area itself.
   * Kept as-is; confirm whether that is intended.
   *
   * rc_type is parenthesised in the comparisons.
   */
  #define HFI_BUFFER_BITSTREAM_ENC(size, frame_width, frame_height, \
                                   rc_type, is_ten_bit) \
      do \
      { \
          HFI_U32 aligned_width, aligned_height, bitstream_size; \
          aligned_width = HFI_ALIGN(frame_width, 32); \
          aligned_height = HFI_ALIGN(frame_height, 32); \
          bitstream_size = aligned_width * aligned_height * 3; \
          if (aligned_width * aligned_height > (4096 * 2176)) \
          { \
              bitstream_size = (bitstream_size >> 3); \
          } \
          else if (bitstream_size > (1280 * 720)) \
          { \
              bitstream_size = (bitstream_size >> 2); \
          } \
          else \
          { \
              bitstream_size = (bitstream_size << 1); \
          } \
          if (((rc_type) == HFI_RC_CQ) || ((rc_type) == HFI_RC_OFF)) \
          { \
              bitstream_size = (bitstream_size << 1); \
          } \
          if (is_ten_bit) \
          { \
              bitstream_size = (bitstream_size) + (bitstream_size >> 2); \
          } \
          size = HFI_ALIGN(bitstream_size, HFI_ALIGNMENT_4096); \
      } while (0)
  /*
   * SIZE_ROI_METADATA_ENC - store the encoder ROI metadata size in size_roi.
   *
   * n_shift is the number of trailing zero bits of lcu_size (log2 for a
   * power of two). The frame is counted in LCUs with each dimension rounded
   * up; the LCU count per row is rounded up to a multiple of 8, two bytes
   * are used per LCU and 256 bytes are added.
   *
   * lcu_size is copied into locals before the shift loop, so the argument
   * may be a literal and a caller's variable is left unchanged. The round-up
   * term uses the full lcu_size rather than the value left over after the
   * loop.
   */
  #define SIZE_ROI_METADATA_ENC(size_roi, frame_width, frame_height, lcu_size) \
      do \
      { \
          HFI_U32 width_in_lcus = 0, height_in_lcus = 0, n_shift = 0; \
          HFI_U32 roi_lcu_size = (lcu_size); \
          HFI_U32 roi_lcu_rem = roi_lcu_size; \
          while (roi_lcu_rem && !(roi_lcu_rem & 0x1)) \
          { \
              n_shift++; \
              roi_lcu_rem = roi_lcu_rem >> 1; \
          } \
          width_in_lcus = ((frame_width) + (roi_lcu_size - 1)) >> n_shift; \
          height_in_lcus = ((frame_height) + (roi_lcu_size - 1)) >> n_shift; \
          size_roi = (((width_in_lcus + 7) >> 3) << 3) * \
                     height_in_lcus * 2 + 256; \
      } while (0)
  /*
   * HFI_BUFFER_INPUT_METADATA_ENC - store the encoder input metadata buffer
   * size in size.
   *
   * The size is 16384 bytes plus, when is_roi_enabled is non-zero, the value
   * produced by SIZE_ROI_METADATA_ENC(); the sum is aligned to
   * HFI_ALIGNMENT_4096.
   */
  #define HFI_BUFFER_INPUT_METADATA_ENC(size, frame_width, frame_height, \
                                        is_roi_enabled, lcu_size) \
      do \
      { \
          HFI_U32 roi_bytes = 0; \
          if (is_roi_enabled) \
          { \
              SIZE_ROI_METADATA_ENC(roi_bytes, frame_width, frame_height, \
                                    lcu_size); \
          } \
          size = roi_bytes + 16384; \
          size = HFI_ALIGN(size, HFI_ALIGNMENT_4096); \
      } while (0)
  /*
   * HFI_BUFFER_INPUT_METADATA_H264E - H.264 encoder wrapper around
   * HFI_BUFFER_INPUT_METADATA_ENC() with lcu_size fixed to the literal 16.
   */
  #define HFI_BUFFER_INPUT_METADATA_H264E(size_metadata, frame_width, \
                                          frame_height, is_roi_enabled) \
      do \
      { \
          HFI_BUFFER_INPUT_METADATA_ENC(size_metadata, frame_width, \
                                        frame_height, is_roi_enabled, 16); \
      } while (0)
  /*
   * HFI_BUFFER_INPUT_METADATA_H265E - H.265 encoder wrapper around
   * HFI_BUFFER_INPUT_METADATA_ENC() with lcu_size fixed to the literal 32.
   */
  #define HFI_BUFFER_INPUT_METADATA_H265E(size_metadata, frame_width, \
                                          frame_height, is_roi_enabled) \
      do \
      { \
          HFI_BUFFER_INPUT_METADATA_ENC(size_metadata, frame_width, \
                                        frame_height, is_roi_enabled, 32); \
      } while (0)
  /* HFI_BUFFER_ARP_ENC - the encoder ARP buffer has a fixed size of 204800 bytes. */
  #define HFI_BUFFER_ARP_ENC(size) \
      do \
      { \
          size = 204800; \
      } while (0)
  /* Encoder-side constants used by the size macros that follow. */
  #define HFI_MAX_COL_FRAME 6
  #define HFI_VENUS_VENC_TRE_WB_BUFF_SIZE (65 << 4) /* bytes */
  #define HFI_VENUS_VENC_DB_LINE_BUFF_PER_MB 512
  #define HFI_VENUS_VPPSG_MAX_REGISTERS 2048
  #define HFI_VENUS_WIDTH_ALIGNMENT 128
  #define HFI_VENUS_WIDTH_TEN_BIT_ALIGNMENT 192
  #define HFI_VENUS_HEIGHT_ALIGNMENT 32
  #define VENUS_METADATA_STRIDE_MULTIPLE 64
  #define VENUS_METADATA_HEIGHT_MULTIPLE 16
  /* May be provided by the including code; 192 is the fallback. */
  #ifndef SYSTEM_LAL_TILE10
  #define SYSTEM_LAL_TILE10 192
  #endif
  /*
   * HFI_IRIS2_ENC_RECON_BUF_COUNT - store the number of encoder recon buffers
   * in num_recon.
   *
   * The reference count starts at 1 (2 when n_bframe is non-zero).
   * With more than one HP layer it becomes:
   *   - (layers + 1) / 2 for hybrid HP or HEVC,
   *   - layers - 1 for AVC with fewer than 4 layers,
   *   - layers otherwise.
   * ltr_count is then added. With more than one HB layer the count is
   * replaced by the layer count for HEVC, or 2^(layers - 2) + 1 for AVC.
   * num_recon is the reference count plus one.
   *
   * All value arguments are parenthesised on use.
   */
  #define HFI_IRIS2_ENC_RECON_BUF_COUNT(num_recon, n_bframe, ltr_count, \
          _total_hp_layers, _total_hb_layers, hybrid_hp, codec_standard) \
      do \
      { \
          HFI_U32 num_ref = 1; \
          if (n_bframe) \
              num_ref = 2; \
          if ((_total_hp_layers) > 1) \
          { \
              if (hybrid_hp) \
                  num_ref = ((_total_hp_layers) + 1) >> 1; \
              else if ((codec_standard) == HFI_CODEC_ENCODE_HEVC) \
                  num_ref = ((_total_hp_layers) + 1) >> 1; \
              else if ((codec_standard) == HFI_CODEC_ENCODE_AVC && \
                       (_total_hp_layers) < 4) \
                  num_ref = ((_total_hp_layers) - 1); \
              else \
                  num_ref = (_total_hp_layers); \
          } \
          if (ltr_count) \
              num_ref = num_ref + (ltr_count); \
          if ((_total_hb_layers) > 1) \
          { \
              if ((codec_standard) == HFI_CODEC_ENCODE_HEVC) \
                  num_ref = (_total_hb_layers); \
              else if ((codec_standard) == HFI_CODEC_ENCODE_AVC) \
                  num_ref = (1 << ((_total_hb_layers) - 2)) + 1; \
          } \
          num_recon = num_ref + 1; \
      } while (0)
  /*
   * SIZE_BIN_BITSTREAM_ENC - store the encoder bin bitstream size estimate in
   * _size.
   *
   * Both dimensions are aligned to lcu_size. Outside HFI_WORKMODE_2 the
   * estimate is area * 3. In HFI_WORKMODE_2:
   *   - HFI_RC_CQ / HFI_RC_OFF: area * 3 / 2;
   *   - otherwise area * 3, then
   *       HFI_RC_LOSSLESS:          times 3/4,
   *       area above 4096x2176:     divided by 8,
   *       area above 480x320:       divided by 4,
   *     and finally times 5/4 when lcu_size is 32.
   * The estimate is aligned to VENUS_DMA_ALIGNMENT.
   *
   * rc_type, work_mode and lcu_size are parenthesised on use.
   */
  #define SIZE_BIN_BITSTREAM_ENC(_size, rc_type, frame_width, frame_height, \
                                 work_mode, lcu_size) \
      do \
      { \
          HFI_U32 size_aligned_width = 0, size_aligned_height = 0; \
          HFI_U32 bitstream_size_eval = 0; \
          size_aligned_width = HFI_ALIGN((frame_width), (lcu_size)); \
          size_aligned_height = HFI_ALIGN((frame_height), (lcu_size)); \
          if ((work_mode) == HFI_WORKMODE_2) \
          { \
              if (((rc_type) == HFI_RC_CQ) || ((rc_type) == HFI_RC_OFF)) \
              { \
                  bitstream_size_eval = (((size_aligned_width) * \
                      (size_aligned_height) * 3) >> 1); \
              } \
              else \
              { \
                  bitstream_size_eval = ((size_aligned_width) * \
                      (size_aligned_height) * 3); \
                  if ((rc_type) == HFI_RC_LOSSLESS) \
                  { \
                      bitstream_size_eval = \
                          ((bitstream_size_eval * 3) >> 2); \
                  } \
                  else if ((size_aligned_width * size_aligned_height) > \
                           (4096 * 2176)) \
                  { \
                      bitstream_size_eval >>= 3; \
                  } \
                  else if ((size_aligned_width * size_aligned_height) > \
                           (480 * 320)) \
                  { \
                      bitstream_size_eval >>= 2; \
                  } \
                  if ((lcu_size) == 32) \
                  { \
                      bitstream_size_eval = \
                          ((bitstream_size_eval * 5) >> 2); \
                  } \
              } \
          } \
          else \
          { \
              bitstream_size_eval = size_aligned_width * \
                                    size_aligned_height * 3; \
          } \
          _size = HFI_ALIGN(bitstream_size_eval, VENUS_DMA_ALIGNMENT); \
      } while (0)
  /*
   * SIZE_ENC_SINGLE_PIPE - store the per-pipe encoder bin size in size.
   *
   * The per-pipe share of bitbin_size is:
   *   - bitbin_size / num_vpp_pipes when the lcu-aligned area exceeds
   *     3840x2160,
   *   - bitbin_size / 2 when there are more than two pipes,
   *   - bitbin_size otherwise,
   * and is doubled for HFI_RC_LOSSLESS. The share is aligned to
   * VENUS_DMA_ALIGNMENT, the SAO bin size
   * (64 * (((w + 32) * (h + 32)) >> 10) + 384, using the unaligned frame
   * dimensions and BUFFER_ALIGNMENT_32_BYTES as the padding) is added, and
   * the sum is aligned again.
   *
   * num_vpp_pipes is used as a divisor in the first case and must be
   * non-zero. rc_type, bitbin_size and num_vpp_pipes are parenthesised on
   * use.
   */
  #define SIZE_ENC_SINGLE_PIPE(size, rc_type, bitbin_size, num_vpp_pipes, \
                               frame_width, frame_height, lcu_size) \
      do \
      { \
          HFI_U32 size_single_pipe_eval = 0, sao_bin_buffer_size = 0, \
                  _padded_bin_sz = 0; \
          HFI_U32 size_aligned_width = 0, size_aligned_height = 0; \
          size_aligned_width = HFI_ALIGN((frame_width), (lcu_size)); \
          size_aligned_height = HFI_ALIGN((frame_height), (lcu_size)); \
          if ((size_aligned_width * size_aligned_height) > (3840 * 2160)) \
          { \
              size_single_pipe_eval = ((bitbin_size) / (num_vpp_pipes)); \
          } \
          else if ((num_vpp_pipes) > 2) \
          { \
              size_single_pipe_eval = (bitbin_size) / 2; \
          } \
          else \
          { \
              size_single_pipe_eval = (bitbin_size); \
          } \
          if ((rc_type) == HFI_RC_LOSSLESS) \
          { \
              size_single_pipe_eval = (size_single_pipe_eval << 1); \
          } \
          sao_bin_buffer_size = (64 * ((((frame_width) + \
              BUFFER_ALIGNMENT_32_BYTES) * ((frame_height) + \
              BUFFER_ALIGNMENT_32_BYTES)) >> 10)) + 384; \
          _padded_bin_sz = HFI_ALIGN(size_single_pipe_eval, \
                                     VENUS_DMA_ALIGNMENT); \
          size_single_pipe_eval = sao_bin_buffer_size + _padded_bin_sz; \
          size_single_pipe_eval = HFI_ALIGN(size_single_pipe_eval, \
                                            VENUS_DMA_ALIGNMENT); \
          size = size_single_pipe_eval; \
      } while (0)
  /*
   * HFI_BUFFER_BIN_ENC - store the encoder bin buffer size in _size.
   *
   * The bitstream estimate comes from SIZE_BIN_BITSTREAM_ENC().
   *   - HFI_WORKMODE_2: three bin buffers, each sized from 1.7 x the
   *     estimate (aligned to VENUS_DMA_ALIGNMENT);
   *   - otherwise, lcu_size 16 or more than one pipe: one bin buffer sized
   *     from the estimate;
   *   - otherwise: no bin buffer, _size is 0.
   * When buffers are needed, SIZE_ENC_SINGLE_PIPE() gives the per-pipe size;
   * it is multiplied by num_vpp_pipes, aligned, multiplied by the buffer
   * count, and 512 bytes are added.
   *
   * work_mode, lcu_size and num_vpp_pipes are parenthesised on use.
   */
  #define HFI_BUFFER_BIN_ENC(_size, rc_type, frame_width, frame_height, \
                             lcu_size, work_mode, num_vpp_pipes) \
      do \
      { \
          HFI_U32 bitstream_size = 0, total_bitbin_buffers = 0, \
                  size_single_pipe = 0, bitbin_size = 0; \
          SIZE_BIN_BITSTREAM_ENC(bitstream_size, rc_type, frame_width, \
                                 frame_height, work_mode, lcu_size); \
          if ((work_mode) == HFI_WORKMODE_2) \
          { \
              total_bitbin_buffers = 3; \
              bitbin_size = bitstream_size * 17 / 10; \
              bitbin_size = HFI_ALIGN(bitbin_size, VENUS_DMA_ALIGNMENT); \
          } \
          else if (((lcu_size) == 16) || ((num_vpp_pipes) > 1)) \
          { \
              total_bitbin_buffers = 1; \
              bitbin_size = bitstream_size; \
          } \
          if (total_bitbin_buffers > 0) \
          { \
              SIZE_ENC_SINGLE_PIPE(size_single_pipe, rc_type, bitbin_size, \
                                   num_vpp_pipes, frame_width, \
                                   frame_height, lcu_size); \
              bitbin_size = size_single_pipe * (num_vpp_pipes); \
              _size = HFI_ALIGN(bitbin_size, VENUS_DMA_ALIGNMENT) * \
                      total_bitbin_buffers + 512; \
          } \
          else \
          /* Avoid the 512-byte allocation for 1-pipe HEVC direct mode. */ \
          { \
              _size = 0; \
          } \
      } while (0)
  /* HFI_BUFFER_BIN_H264E - HFI_BUFFER_BIN_ENC() with lcu_size fixed to 16. */
  #define HFI_BUFFER_BIN_H264E(_size, rc_type, frame_width, frame_height, \
                               work_mode, num_vpp_pipes) \
      do \
      { \
          HFI_BUFFER_BIN_ENC(_size, rc_type, frame_width, frame_height, \
                             16, work_mode, num_vpp_pipes); \
      } while (0)
  /* HFI_BUFFER_BIN_H265E - HFI_BUFFER_BIN_ENC() with lcu_size fixed to 32. */
  #define HFI_BUFFER_BIN_H265E(_size, rc_type, frame_width, frame_height, \
                               work_mode, num_vpp_pipes) \
      do \
      { \
          HFI_BUFFER_BIN_ENC(_size, rc_type, frame_width, frame_height, \
                             32, work_mode, num_vpp_pipes); \
      } while (0)
  /*
   * SIZE_ENC_SLICE_INFO_BUF - 256 bytes plus 16 bytes per LCU, aligned to
   * VENUS_DMA_ALIGNMENT. num_lcu_in_frame is parenthesised on use.
   */
  #define SIZE_ENC_SLICE_INFO_BUF(num_lcu_in_frame) \
      HFI_ALIGN((256 + ((num_lcu_in_frame) << 4)), VENUS_DMA_ALIGNMENT)
  /* Both control line buffers are the coded width aligned to VENUS_DMA_ALIGNMENT. */
  #define SIZE_LINE_BUF_CTRL(frame_width_coded) \
      HFI_ALIGN(frame_width_coded, VENUS_DMA_ALIGNMENT)
  #define SIZE_LINE_BUF_CTRL_ID2(frame_width_coded) \
      HFI_ALIGN(frame_width_coded, VENUS_DMA_ALIGNMENT)
  /*
   * SIZE_LINEBUFF_DATA - store the encoder data line buffer size in _size.
   *
   * With n = 10 for 10-bit content and 8 otherwise, the raw line size is
   * n * frame_width_coded + 1024. The result is that size rounded up to
   * VENUS_DMA_ALIGNMENT, plus twice (half of that size rounded up to
   * VENUS_DMA_ALIGNMENT).
   */
  #define SIZE_LINEBUFF_DATA(_size, is_ten_bit, frame_width_coded) \
      do \
      { \
          int lbd_bits_per_px = is_ten_bit ? 10 : 8; \
          _size = (((((lbd_bits_per_px * (frame_width_coded) + 1024) + \
                      (VENUS_DMA_ALIGNMENT - 1)) & \
                     (~(VENUS_DMA_ALIGNMENT - 1))) * 1) + \
                   (((((lbd_bits_per_px * (frame_width_coded) + 1024) >> 1) + \
                      (VENUS_DMA_ALIGNMENT - 1)) & \
                     (~(VENUS_DMA_ALIGNMENT - 1))) * 2)); \
      } while (0)
  /*
   * SIZE_LEFT_LINEBUFF_CTRL - store the encoder left control line buffer size
   * in _size.
   *
   * HEVC:  ((height + BUF_SIZE_ALIGN_32) / BUF_SIZE_ALIGN_32) * 4 * 16.
   * Other: ((height + 15) / 16) * 5 * 16.
   * With more than one pipe, BUFFER_ALIGNMENT_512_BYTES is added, the value
   * is aligned to BUFFER_ALIGNMENT_512_BYTES and multiplied by the pipe
   * count. The result is aligned to VENUS_DMA_ALIGNMENT.
   *
   * standard is parenthesised in the comparison.
   */
  #define SIZE_LEFT_LINEBUFF_CTRL(_size, standard, frame_height_coded, \
                                  num_vpp_pipes_enc) \
      do \
      { \
          _size = ((standard) == HFI_CODEC_ENCODE_HEVC) ? \
              (((frame_height_coded) + (BUF_SIZE_ALIGN_32)) / \
               BUF_SIZE_ALIGN_32 * 4 * 16) : \
              (((frame_height_coded) + 15) / 16 * 5 * 16); \
          if ((num_vpp_pipes_enc) > 1) \
          { \
              _size += BUFFER_ALIGNMENT_512_BYTES; \
              _size = HFI_ALIGN(_size, BUFFER_ALIGNMENT_512_BYTES) * \
                      (num_vpp_pipes_enc); \
          } \
          _size = HFI_ALIGN(_size, VENUS_DMA_ALIGNMENT); \
      } while (0)
  /*
   * SIZE_LEFT_LINEBUFF_RECON_PIX - store the encoder left recon pixel line
   * buffer size in _size.
   *
   * The raw size is (is_ten_bit + 1) * 2 * frame_height_coded +
   * VENUS_DMA_ALIGNMENT, rounded up to a multiple of
   * VENUS_DMA_ALIGNMENT << (num_vpp_pipes_enc - 1).
   *
   * num_vpp_pipes_enc must be at least 1 (it is used as a shift count minus
   * one). is_ten_bit and num_vpp_pipes_enc are parenthesised on use.
   */
  #define SIZE_LEFT_LINEBUFF_RECON_PIX(_size, is_ten_bit, frame_height_coded, \
                                       num_vpp_pipes_enc) \
      do \
      { \
          _size = ((((is_ten_bit) + 1) * 2 * (frame_height_coded) + \
                    VENUS_DMA_ALIGNMENT) + \
                   (VENUS_DMA_ALIGNMENT << ((num_vpp_pipes_enc) - 1)) - 1) & \
                  (~((VENUS_DMA_ALIGNMENT << \
                      ((num_vpp_pipes_enc) - 1)) - 1)) * 1; \
      } while (0)
  /*
   * SIZE_TOP_LINEBUFF_CTRL_FE - store the encoder FE top control line buffer
   * size in _size.
   *
   * HEVC:  64 bytes per 32-pixel column.
   * Other: VENUS_DMA_ALIGNMENT + 16 bytes per 16-pixel column.
   * The result is aligned to VENUS_DMA_ALIGNMENT.
   *
   * standard is parenthesised in the comparison.
   */
  #define SIZE_TOP_LINEBUFF_CTRL_FE(_size, frame_width_coded, standard) \
      do \
      { \
          _size = ((standard) == HFI_CODEC_ENCODE_HEVC) ? \
              (64 * ((frame_width_coded) >> 5)) : \
              (VENUS_DMA_ALIGNMENT + 16 * ((frame_width_coded) >> 4)); \
          _size = HFI_ALIGN(_size, VENUS_DMA_ALIGNMENT); \
      } while (0)
  /*
   * SIZE_LEFT_LINEBUFF_CTRL_FE - encoder FE left control line buffer size.
   *
   * VENUS_DMA_ALIGNMENT + 64 bytes per 16-pixel row is rounded up to a
   * multiple of VENUS_DMA_ALIGNMENT << (num_vpp_pipes_enc - 1) and then
   * multiplied by num_vpp_pipes_enc.
   *
   * num_vpp_pipes_enc must be at least 1 and is parenthesised on use.
   */
  #define SIZE_LEFT_LINEBUFF_CTRL_FE(frame_height_coded, num_vpp_pipes_enc) \
      ((((VENUS_DMA_ALIGNMENT + 64 * ((frame_height_coded) >> 4)) + \
         (VENUS_DMA_ALIGNMENT << ((num_vpp_pipes_enc) - 1)) - 1) & \
        (~((VENUS_DMA_ALIGNMENT << ((num_vpp_pipes_enc) - 1)) - 1)) * 1) * \
       (num_vpp_pipes_enc))
  /*
   * SIZE_LEFT_LINEBUFF_METADATA_RECON_Y - store the encoder left luma recon
   * metadata line buffer size in _size.
   *
   * VENUS_DMA_ALIGNMENT + 64 * (height / (8 * t)), with t = 4 for 10-bit
   * content and 8 otherwise, aligned to VENUS_DMA_ALIGNMENT and multiplied
   * by num_vpp_pipes_enc.
   *
   * is_ten_bit and num_vpp_pipes_enc are parenthesised on use.
   */
  #define SIZE_LEFT_LINEBUFF_METADATA_RECON_Y(_size, frame_height_coded, \
                                              is_ten_bit, num_vpp_pipes_enc) \
      do \
      { \
          _size = ((VENUS_DMA_ALIGNMENT + 64 * ((frame_height_coded) / \
                    (8 * ((is_ten_bit) ? 4 : 8))))); \
          _size = HFI_ALIGN(_size, VENUS_DMA_ALIGNMENT); \
          _size = (_size * (num_vpp_pipes_enc)); \
      } while (0)
  /*
   * SIZE_LEFT_LINEBUFF_METADATA_RECON_UV - store the encoder left chroma
   * recon metadata line buffer size in _size.
   *
   * VENUS_DMA_ALIGNMENT + 64 * (height / (4 * t)), with t = 4 for 10-bit
   * content and 8 otherwise, aligned to VENUS_DMA_ALIGNMENT and multiplied
   * by num_vpp_pipes_enc.
   *
   * is_ten_bit and num_vpp_pipes_enc are parenthesised on use.
   */
  #define SIZE_LEFT_LINEBUFF_METADATA_RECON_UV(_size, frame_height_coded, \
                                               is_ten_bit, num_vpp_pipes_enc) \
      do \
      { \
          _size = ((VENUS_DMA_ALIGNMENT + 64 * ((frame_height_coded) / \
                    (4 * ((is_ten_bit) ? 4 : 8))))); \
          _size = HFI_ALIGN(_size, VENUS_DMA_ALIGNMENT); \
          _size = (_size * (num_vpp_pipes_enc)); \
      } while (0)
  /*
   * SIZE_LINEBUFF_RECON_PIX - store the encoder recon pixel line buffer size
   * in _size: 3 bytes per coded pixel column for 10-bit content, 2
   * otherwise, aligned to VENUS_DMA_ALIGNMENT.
   */
  #define SIZE_LINEBUFF_RECON_PIX(_size, is_ten_bit, frame_width_coded) \
      do \
      { \
          _size = ((is_ten_bit ? 3 : 2) * (frame_width_coded)); \
          _size = HFI_ALIGN(_size, VENUS_DMA_ALIGNMENT); \
      } while (0)
  /* Fixed terms of HFI_BUFFER_NON_COMV_ENC(). */
  #define SIZE_SLICE_CMD_BUFFER (HFI_ALIGN(20480, VENUS_DMA_ALIGNMENT))
  #define SIZE_SPS_PPS_SLICE_HDR (2048 + 4096)
  /*
   * SIZE_FRAME_RC_BUF_SIZE - store the encoder frame RC buffer size in _size.
   *
   * The base is 256 + 16 * (14 + ceil(rows / 8)), where rows is the coded
   * height in 32-pixel rows for HEVC and in 16-pixel rows otherwise. The
   * base is multiplied by 6. With more than one pipe it is aligned to
   * VENUS_DMA_ALIGNMENT and multiplied by the pipe count. Finally it is
   * aligned to BUFFER_ALIGNMENT_512_BYTES and multiplied by
   * HFI_MAX_COL_FRAME.
   *
   * standard and num_vpp_pipes_enc are parenthesised on use.
   */
  #define SIZE_FRAME_RC_BUF_SIZE(_size, standard, frame_height_coded, \
                                 num_vpp_pipes_enc) \
      do \
      { \
          _size = ((standard) == HFI_CODEC_ENCODE_HEVC) ? \
              (256 + 16 * (14 + ((((frame_height_coded) >> 5) + 7) >> 3))) : \
              (256 + 16 * (14 + ((((frame_height_coded) >> 4) + 7) >> 3))); \
          _size *= 6; \
          if ((num_vpp_pipes_enc) > 1) \
          { \
              _size = HFI_ALIGN(_size, VENUS_DMA_ALIGNMENT) * \
                      (num_vpp_pipes_enc); \
          } \
          _size = HFI_ALIGN(_size, BUFFER_ALIGNMENT_512_BYTES) * \
                  HFI_MAX_COL_FRAME; \
      } while (0)
  /* Each of these is 256 bytes plus a per-unit term, aligned to VENUS_DMA_ALIGNMENT. */

  /* 4 bytes per LCU. */
  #define ENC_BITCNT_BUF_SIZE(num_lcu_in_frame) \
      HFI_ALIGN((256 + (4 * (num_lcu_in_frame))), VENUS_DMA_ALIGNMENT)
  /* One bit per LCU (count >> 3 bytes). */
  #define ENC_BITMAP_BUF_SIZE(num_lcu_in_frame) \
      HFI_ALIGN((256 + ((num_lcu_in_frame) >> 3)), VENUS_DMA_ALIGNMENT)
  /* 16 bytes per 16-pixel column of the coded width. */
  #define SIZE_LINE_BUF_SDE(frame_width_coded) \
      HFI_ALIGN((256 + (16 * ((frame_width_coded) >> 4))), VENUS_DMA_ALIGNMENT)
  /* Fixed terms of HFI_BUFFER_NON_COMV_ENC(). */
  /* (8192 << 2) rounded up to a multiple of 8, times 6. */
  #define SIZE_BSE_SLICE_CMD_BUF ((((8192 << 2) + 7) & (~7)) * 6)
  /* (512 << 3) rounded up to a multiple of 8, times 4. */
  #define SIZE_BSE_REG_BUF ((((512 << 3) + 7) & (~7)) * 4)
  /* 8 bytes per VPPSG register, rounded up to a multiple of 32, times 10. */
  #define SIZE_VPP_REG_BUF \
      ((((HFI_VENUS_VPPSG_MAX_REGISTERS << 3) + 31) & (~31)) * 10)
  #define SIZE_LAMBDA_LUT (256 * 11)
  /*
   * SIZE_OVERRIDE_BUF - 16 bytes per group of 8 units (rounded up), aligned
   * to VENUS_DMA_ALIGNMENT, times 2.
   */
  #define SIZE_OVERRIDE_BUF(num_lcumb) \
      (HFI_ALIGN(((16 * (((num_lcumb) + 7) >> 3))), VENUS_DMA_ALIGNMENT) * 2)
  /*
   * SIZE_IR_BUF - twice the LCU count rounded up to a multiple of 8, times
   * 3, aligned to VENUS_DMA_ALIGNMENT.
   */
  #define SIZE_IR_BUF(num_lcu_in_frame) \
      HFI_ALIGN((((((num_lcu_in_frame) << 1) + 7) & (~7)) * 3), \
                VENUS_DMA_ALIGNMENT)
  /*
   * SIZE_VPSS_LINE_BUF - encoder VPSS line buffer size, aligned to
   * VENUS_DMA_ALIGNMENT. Sum of:
   *   - ((8192 >> 2) << 5) bytes per pipe, plus 64;
   *   - 16 * ((((longer coded side + 3) >> 2) << 5) + 256).
   */
  #define SIZE_VPSS_LINE_BUF(num_vpp_pipes_enc, frame_height_coded, \
                             frame_width_coded) \
      (HFI_ALIGN(((((((8192) >> 2) << 5) * (num_vpp_pipes_enc)) + 64) + \
                  (((((MAX((frame_width_coded), \
                           (frame_height_coded)) + 3) >> 2) << 5) + \
                    256) * 16)), \
                 VENUS_DMA_ALIGNMENT))
  /* 16 bytes per 32-pixel column of the coded width, aligned to VENUS_DMA_ALIGNMENT. */
  #define SIZE_TOP_LINE_BUF_FIRST_STG_SAO(frame_width_coded) \
      HFI_ALIGN((16 * ((frame_width_coded) >> 5)), VENUS_DMA_ALIGNMENT)
  /*
   * HFI_BUFFER_LINE_ENC - store the encoder line buffer size in _size.
   *
   * The frame dimensions are rounded up to whole LCUs to obtain the coded
   * width and height. The result is the sum of the sizes produced by the
   * SIZE_LINE_BUF_*, SIZE_*LINEBUFF_*, SIZE_VPSS_LINE_BUF and
   * SIZE_TOP_LINE_BUF_FIRST_STG_SAO helpers for those coded dimensions.
   */
  #define HFI_BUFFER_LINE_ENC(_size, frame_width, frame_height, is_ten_bit, \
                              num_vpp_pipes_enc, lcu_size, standard) \
      do \
      { \
          HFI_U32 lcus_wide = 0, lcus_high = 0, coded_w = 0, coded_h = 0; \
          HFI_U32 lb_data = 0, left_ctrl = 0, left_recon_pix = 0, \
                  top_ctrl_fe = 0; \
          HFI_U32 left_meta_y = 0, left_meta_uv = 0, recon_pix = 0; \
          lcus_wide = ((frame_width) + (lcu_size) - 1) / (lcu_size); \
          lcus_high = ((frame_height) + (lcu_size) - 1) / (lcu_size); \
          coded_w = lcus_wide * (lcu_size); \
          coded_h = lcus_high * (lcu_size); \
          SIZE_LINEBUFF_DATA(lb_data, is_ten_bit, coded_w); \
          SIZE_LEFT_LINEBUFF_CTRL(left_ctrl, standard, coded_h, \
                                  num_vpp_pipes_enc); \
          SIZE_LEFT_LINEBUFF_RECON_PIX(left_recon_pix, is_ten_bit, coded_h, \
                                       num_vpp_pipes_enc); \
          SIZE_TOP_LINEBUFF_CTRL_FE(top_ctrl_fe, coded_w, standard); \
          SIZE_LEFT_LINEBUFF_METADATA_RECON_Y(left_meta_y, coded_h, \
                                              is_ten_bit, num_vpp_pipes_enc); \
          SIZE_LEFT_LINEBUFF_METADATA_RECON_UV(left_meta_uv, coded_h, \
                                               is_ten_bit, \
                                               num_vpp_pipes_enc); \
          SIZE_LINEBUFF_RECON_PIX(recon_pix, is_ten_bit, coded_w); \
          _size = SIZE_LINE_BUF_CTRL(coded_w) + \
                  SIZE_LINE_BUF_CTRL_ID2(coded_w) + \
                  lb_data + \
                  left_ctrl + \
                  left_recon_pix + \
                  top_ctrl_fe + \
                  left_meta_y + \
                  left_meta_uv + \
                  recon_pix + \
                  SIZE_LEFT_LINEBUFF_CTRL_FE(coded_h, num_vpp_pipes_enc) + \
                  SIZE_LINE_BUF_SDE(coded_w) + \
                  SIZE_VPSS_LINE_BUF(num_vpp_pipes_enc, coded_h, coded_w) + \
                  SIZE_TOP_LINE_BUF_FIRST_STG_SAO(coded_w); \
      } while (0)
  /*
   * HFI_BUFFER_LINE_H264E - HFI_BUFFER_LINE_ENC() for AVC with lcu_size 16.
   * The is_ten_bit argument is ignored: 0 is always passed on.
   */
  #define HFI_BUFFER_LINE_H264E(_size, frame_width, frame_height, is_ten_bit, \
                                num_vpp_pipes) \
      do \
      { \
          HFI_BUFFER_LINE_ENC(_size, frame_width, frame_height, 0, \
                              num_vpp_pipes, 16, HFI_CODEC_ENCODE_AVC); \
      } while (0)
  /* HFI_BUFFER_LINE_H265E - HFI_BUFFER_LINE_ENC() for HEVC with lcu_size 32. */
  #define HFI_BUFFER_LINE_H265E(_size, frame_width, frame_height, is_ten_bit, \
                                num_vpp_pipes) \
      do \
      { \
          HFI_BUFFER_LINE_ENC(_size, frame_width, frame_height, is_ten_bit, \
                              num_vpp_pipes, 32, HFI_CODEC_ENCODE_HEVC); \
      } while (0)
  /*
   * HFI_BUFFER_COMV_ENC - store the encoder COMV buffer size in _size.
   *
   * Collocated MV part, per recon buffer:
   *   HEVC:  16 * (4 * LCU count + BUFFER_ALIGNMENT_32_BYTES),
   *   other: 3 * 16 * (LCU count + BUFFER_ALIGNMENT_32_BYTES),
   * aligned to VENUS_DMA_ALIGNMENT and multiplied by num_recon.
   * Collocated RC part: ceil(mb_width / 8) * 16 * 2 * mb_height (with
   * 16x16 macroblocks), aligned and multiplied by HFI_MAX_COL_FRAME.
   * _size is the sum of both parts.
   *
   * standard and num_recon are parenthesised on use.
   */
  #define HFI_BUFFER_COMV_ENC(_size, frame_width, frame_height, lcu_size, \
                              num_recon, standard) \
      do \
      { \
          HFI_U32 size_colloc_mv = 0, size_colloc_rc = 0; \
          HFI_U32 mb_width = ((frame_width) + 15) >> 4; \
          HFI_U32 mb_height = ((frame_height) + 15) >> 4; \
          HFI_U32 width_in_lcus = ((frame_width) + (lcu_size) - 1) / \
                                  (lcu_size); \
          HFI_U32 height_in_lcus = ((frame_height) + (lcu_size) - 1) / \
                                   (lcu_size); \
          HFI_U32 num_lcu_in_frame = width_in_lcus * height_in_lcus; \
          size_colloc_mv = ((standard) == HFI_CODEC_ENCODE_HEVC) ? \
              (16 * ((num_lcu_in_frame << 2) + BUFFER_ALIGNMENT_32_BYTES)) : \
              (3 * 16 * (width_in_lcus * height_in_lcus + \
                         BUFFER_ALIGNMENT_32_BYTES)); \
          size_colloc_mv = HFI_ALIGN(size_colloc_mv, VENUS_DMA_ALIGNMENT) * \
                           (num_recon); \
          size_colloc_rc = (((mb_width + 7) >> 3) * 16 * 2 * mb_height); \
          size_colloc_rc = HFI_ALIGN(size_colloc_rc, VENUS_DMA_ALIGNMENT) * \
                           HFI_MAX_COL_FRAME; \
          _size = size_colloc_mv + size_colloc_rc; \
      } while (0)
  /* HFI_BUFFER_COMV_H264E - HFI_BUFFER_COMV_ENC() for AVC with lcu_size 16. */
  #define HFI_BUFFER_COMV_H264E(_size, frame_width, frame_height, num_recon) \
      do \
      { \
          HFI_BUFFER_COMV_ENC(_size, frame_width, frame_height, 16, \
                              num_recon, HFI_CODEC_ENCODE_AVC); \
      } while (0)
  /* HFI_BUFFER_COMV_H265E - HFI_BUFFER_COMV_ENC() for HEVC with lcu_size 32. */
  #define HFI_BUFFER_COMV_H265E(_size, frame_width, frame_height, num_recon) \
      do \
      { \
          HFI_BUFFER_COMV_ENC(_size, frame_width, frame_height, 32, \
                              num_recon, HFI_CODEC_ENCODE_HEVC); \
      } while (0)
  /*
   * HFI_BUFFER_NON_COMV_ENC - store the encoder non-COMV buffer size in
   * _size.
   *
   * The frame is rounded up to whole LCUs. num_lcumb is the number of LCU
   * rows times (LCU columns + 8). The result is the sum of the frame RC
   * buffer size from SIZE_FRAME_RC_BUF_SIZE() and the slice info, slice
   * command, SPS/PPS/slice header, bit count, bitmap, BSE slice command, BSE
   * register, VPP register, lambda LUT, override and IR buffer sizes.
   *
   * lcu_size is used as a divisor and must be non-zero; it is parenthesised
   * on every use.
   */
  #define HFI_BUFFER_NON_COMV_ENC(_size, frame_width, frame_height, \
                                  num_vpp_pipes_enc, lcu_size, standard) \
      do \
      { \
          HFI_U32 width_in_lcus = 0, height_in_lcus = 0, \
                  frame_width_coded = 0, frame_height_coded = 0, \
                  num_lcu_in_frame = 0, num_lcumb = 0; \
          HFI_U32 frame_rc_buf_size = 0; \
          width_in_lcus = ((frame_width) + (lcu_size) - 1) / (lcu_size); \
          height_in_lcus = ((frame_height) + (lcu_size) - 1) / (lcu_size); \
          num_lcu_in_frame = width_in_lcus * height_in_lcus; \
          frame_width_coded = width_in_lcus * (lcu_size); \
          frame_height_coded = height_in_lcus * (lcu_size); \
          num_lcumb = (frame_height_coded / (lcu_size)) * \
                      ((frame_width_coded + (lcu_size) * 8) / (lcu_size)); \
          SIZE_FRAME_RC_BUF_SIZE(frame_rc_buf_size, standard, \
                                 frame_height_coded, num_vpp_pipes_enc); \
          _size = SIZE_ENC_SLICE_INFO_BUF(num_lcu_in_frame) + \
                  SIZE_SLICE_CMD_BUFFER + \
                  SIZE_SPS_PPS_SLICE_HDR + \
                  frame_rc_buf_size + \
                  ENC_BITCNT_BUF_SIZE(num_lcu_in_frame) + \
                  ENC_BITMAP_BUF_SIZE(num_lcu_in_frame) + \
                  SIZE_BSE_SLICE_CMD_BUF + \
                  SIZE_BSE_REG_BUF + \
                  SIZE_VPP_REG_BUF + \
                  SIZE_LAMBDA_LUT + \
                  SIZE_OVERRIDE_BUF(num_lcumb) + \
                  SIZE_IR_BUF(num_lcu_in_frame); \
      } while (0)
  /* HFI_BUFFER_NON_COMV_H264E - HFI_BUFFER_NON_COMV_ENC() for AVC with lcu_size 16. */
  #define HFI_BUFFER_NON_COMV_H264E(_size, frame_width, frame_height, \
                                    num_vpp_pipes_enc) \
      do \
      { \
          HFI_BUFFER_NON_COMV_ENC(_size, frame_width, frame_height, \
                                  num_vpp_pipes_enc, 16, \
                                  HFI_CODEC_ENCODE_AVC); \
      } while (0)
  /* HFI_BUFFER_NON_COMV_H265E - HFI_BUFFER_NON_COMV_ENC() for HEVC with lcu_size 32. */
  #define HFI_BUFFER_NON_COMV_H265E(_size, frame_width, frame_height, \
                                    num_vpp_pipes_enc) \
      do \
      { \
          HFI_BUFFER_NON_COMV_ENC(_size, frame_width, frame_height, \
                                  num_vpp_pipes_enc, 32, \
                                  HFI_CODEC_ENCODE_HEVC); \
      } while (0)
  /*
   * SIZE_ENC_REF_BUFFER - store the 8-bit encoder reference buffer size in
   * size.
   *
   * The luma height is frame_height aligned to HFI_VENUS_HEIGHT_ALIGNMENT,
   * the chroma height is frame_height / 2 aligned the same way, and the
   * width is frame_width aligned to HFI_VENUS_WIDTH_ALIGNMENT. The size is
   * (luma height + chroma height) * width.
   *
   * frame_height is parenthesised before it is halved.
   */
  #define SIZE_ENC_REF_BUFFER(size, frame_width, frame_height) \
      do \
      { \
          HFI_U32 u_buffer_width = 0, u_buffer_height = 0, \
                  u_chroma_buffer_height = 0; \
          u_buffer_height = HFI_ALIGN(frame_height, \
                                      HFI_VENUS_HEIGHT_ALIGNMENT); \
          u_chroma_buffer_height = (frame_height) >> 1; \
          u_chroma_buffer_height = HFI_ALIGN(u_chroma_buffer_height, \
                                             HFI_VENUS_HEIGHT_ALIGNMENT); \
          u_buffer_width = HFI_ALIGN(frame_width, \
                                     HFI_VENUS_WIDTH_ALIGNMENT); \
          size = (u_buffer_height + u_chroma_buffer_height) * \
                 u_buffer_width; \
      } while (0)
  /*
   * SIZE_ENC_TEN_BIT_REF_BUFFER - store the 10-bit encoder reference buffer
   * size in size.
   *
   * The luma stride in bytes is frame_width rounded up to a multiple of
   * SYSTEM_LAL_TILE10; the reference stride is 4 * (that / 3), rounded up to
   * BUF_SIZE_ALIGN_128. The luma plane is the stride times frame_height
   * rounded up to HFI_VENUS_HEIGHT_ALIGNMENT; the chroma plane is the stride
   * times ceil(frame_height / 2) rounded up to BUF_SIZE_ALIGN_32. Each plane
   * is rounded up to BUF_SIZE_ALIGN_4096 and the two are added.
   *
   * frame_width and frame_height are parenthesised on use.
   */
  #define SIZE_ENC_TEN_BIT_REF_BUFFER(size, frame_width, frame_height) \
      do \
      { \
          HFI_U32 ref_buf_height = 0, ref_luma_stride_in_bytes = 0, \
                  u_ref_stride = 0, luma_size = 0, \
                  ref_chrm_height_in_bytes = 0, chroma_size = 0, \
                  ref_buf_size = 0; \
          ref_buf_height = ((frame_height) + \
                            (HFI_VENUS_HEIGHT_ALIGNMENT - 1)) & \
                           (~(HFI_VENUS_HEIGHT_ALIGNMENT - 1)); \
          ref_luma_stride_in_bytes = (((frame_width) + \
              SYSTEM_LAL_TILE10 - 1) / SYSTEM_LAL_TILE10) * \
              SYSTEM_LAL_TILE10; \
          u_ref_stride = 4 * (ref_luma_stride_in_bytes / 3); \
          u_ref_stride = (u_ref_stride + (BUF_SIZE_ALIGN_128 - 1)) & \
                         (~(BUF_SIZE_ALIGN_128 - 1)); \
          luma_size = ref_buf_height * u_ref_stride; \
          ref_chrm_height_in_bytes = ((((frame_height) + 1) >> 1) + \
              (BUF_SIZE_ALIGN_32 - 1)) & (~(BUF_SIZE_ALIGN_32 - 1)); \
          chroma_size = u_ref_stride * ref_chrm_height_in_bytes; \
          luma_size = (luma_size + (BUF_SIZE_ALIGN_4096 - 1)) & \
                      (~(BUF_SIZE_ALIGN_4096 - 1)); \
          chroma_size = (chroma_size + (BUF_SIZE_ALIGN_4096 - 1)) & \
                        (~(BUF_SIZE_ALIGN_4096 - 1)); \
          ref_buf_size = luma_size + chroma_size; \
          size = ref_buf_size; \
      } while (0)
  /*
   * Computes the encoder DPB buffer size and stores it in `_size`.
   *
   *   _size        - lvalue that receives the result.
   *   frame_width  - frame width.
   *   frame_height - frame height.
   *   is_ten_bit   - zero selects the SIZE_ENC_REF_BUFFER path with the NV12
   *                  UBWC tile constants; non-zero selects the
   *                  SIZE_ENC_TEN_BIT_REF_BUFFER path with the TP10 UBWC tile
   *                  constants.
   *
   * In both paths the result is the reference buffer size plus two metadata
   * plane sizes (meta_size_y and meta_size_c). Both metadata sizes are
   * derived from the same stride/height pair, which is computed with the
   * Y tile dimensions.
   *
   * is_ten_bit is parenthesized before negation so that an expression
   * argument such as `fmt == X` is negated as a whole. frame_width and
   * frame_height are parenthesized when forwarded so the nested macros
   * always receive a single primary expression.
   *
   * NOTE(review): the non-ten-bit path passes the literals 64 and 16 where
   * the ten-bit path passes VENUS_METADATA_STRIDE_MULTIPLE and
   * VENUS_METADATA_HEIGHT_MULTIPLE; confirm whether these are meant to be the
   * same values.
   */
  #define HFI_BUFFER_DPB_ENC(_size, frame_width, frame_height, is_ten_bit) \
      do { \
          HFI_U32 metadata_stride, metadata_buf_height, meta_size_y, \
                  meta_size_c; \
          HFI_U32 ten_bit_ref_buf_size = 0, ref_buf_size = 0; \
          if (!(is_ten_bit)) { \
              SIZE_ENC_REF_BUFFER(ref_buf_size, (frame_width), \
                                  (frame_height)); \
              HFI_UBWC_CALC_METADATA_PLANE_STRIDE(metadata_stride, \
                  (frame_width), 64, \
                  HFI_COLOR_FORMAT_YUV420_NV12_UBWC_Y_TILE_WIDTH); \
              HFI_UBWC_METADATA_PLANE_BUFHEIGHT(metadata_buf_height, \
                  (frame_height), 16, \
                  HFI_COLOR_FORMAT_YUV420_NV12_UBWC_Y_TILE_HEIGHT); \
              HFI_UBWC_METADATA_PLANE_BUFFER_SIZE(meta_size_y, \
                  metadata_stride, metadata_buf_height); \
              HFI_UBWC_METADATA_PLANE_BUFFER_SIZE(meta_size_c, \
                  metadata_stride, metadata_buf_height); \
              (_size) = ref_buf_size + meta_size_y + meta_size_c; \
          } else { \
              SIZE_ENC_TEN_BIT_REF_BUFFER(ten_bit_ref_buf_size, \
                  (frame_width), (frame_height)); \
              HFI_UBWC_CALC_METADATA_PLANE_STRIDE(metadata_stride, \
                  (frame_width), VENUS_METADATA_STRIDE_MULTIPLE, \
                  HFI_COLOR_FORMAT_YUV420_TP10_UBWC_Y_TILE_WIDTH); \
              HFI_UBWC_METADATA_PLANE_BUFHEIGHT(metadata_buf_height, \
                  (frame_height), VENUS_METADATA_HEIGHT_MULTIPLE, \
                  HFI_COLOR_FORMAT_YUV420_TP10_UBWC_Y_TILE_HEIGHT); \
              HFI_UBWC_METADATA_PLANE_BUFFER_SIZE(meta_size_y, \
                  metadata_stride, metadata_buf_height); \
              HFI_UBWC_METADATA_PLANE_BUFFER_SIZE(meta_size_c, \
                  metadata_stride, metadata_buf_height); \
              (_size) = ten_bit_ref_buf_size + meta_size_y + \
                        meta_size_c; \
          } \
      } while (0)
  /*
   * H.264 encoder DPB size: delegates to HFI_BUFFER_DPB_ENC with is_ten_bit
   * fixed to 0, so only the non-ten-bit branch of that macro is taken.
   */
  #define HFI_BUFFER_DPB_H264E(_size, frame_width, frame_height) \
      do { \
          HFI_BUFFER_DPB_ENC(_size, frame_width, frame_height, 0); \
      } while (0)
  /*
   * H.265 encoder DPB size: delegates to HFI_BUFFER_DPB_ENC, passing the
   * caller's is_ten_bit flag through unchanged.
   */
  #define HFI_BUFFER_DPB_H265E(_size, frame_width, frame_height, \
                               is_ten_bit) \
      do { \
          HFI_BUFFER_DPB_ENC(_size, frame_width, frame_height, \
                             is_ten_bit); \
      } while (0)
  /*
   * Encoder VPSS buffer size.
   *
   * vpss_size is first reset to 0. Only when ds_enable is non-zero is it then
   * overwritten with the HFI_BUFFER_DPB_ENC result for dswidth x dsheight
   * and the given is_ten_bit flag.
   */
  #define HFI_BUFFER_VPSS_ENC(vpss_size, dswidth, dsheight, ds_enable, \
                              is_ten_bit) \
      do { \
          vpss_size = 0; \
          if (ds_enable) { \
              HFI_BUFFER_DPB_ENC(vpss_size, dswidth, dsheight, \
                                 is_ten_bit); \
          } \
      } while (0)
  /*
   * Computes the minimum encoder input buffer count and stores it in
   * `numInput`.
   *
   *   numInput      - lvalue that receives the result.
   *   TotalHBLayers - layer count used to scale the result.
   *
   * The result is 3 when TotalHBLayers is below 2, otherwise
   * 2^(TotalHBLayers - 1) + 2.
   *
   * TotalHBLayers is parenthesized at each use so that expression arguments
   * (for example a conditional expression) are compared and decremented as a
   * whole. It is expanded twice, so arguments with side effects must be
   * avoided. The shift is performed on an int constant, so layer counts
   * large enough to shift past the width of int are not supported.
   */
  #define HFI_IRIS2_ENC_MIN_INPUT_BUF_COUNT(numInput, TotalHBLayers) \
      do { \
          (numInput) = 3; \
          if ((TotalHBLayers) >= 2) { \
              (numInput) = (1 << ((TotalHBLayers) - 1)) + 2; \
          } \
      } while (0)
  1390. #endif /* __HFI_BUFFER_IRIS2__ */