kfd_pm4_headers_ai.h 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584
  1. /*
  2. * Copyright 2016 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #ifndef F32_MES_PM4_PACKETS_H
  24. #define F32_MES_PM4_PACKETS_H
  25. #ifndef PM4_MES_HEADER_DEFINED
  26. #define PM4_MES_HEADER_DEFINED
  27. union PM4_MES_TYPE_3_HEADER {
  28. struct {
  29. uint32_t reserved1 : 8; /* < reserved */
  30. uint32_t opcode : 8; /* < IT opcode */
  31. uint32_t count : 14;/* < number of DWORDs - 1 in the
  32. * information body.
  33. */
  34. uint32_t type : 2; /* < packet identifier.
  35. * It should be 3 for type 3 packets
  36. */
  37. };
  38. uint32_t u32All;
  39. };
  40. #endif /* PM4_MES_HEADER_DEFINED */
  41. /*--------------------MES_SET_RESOURCES--------------------*/
  42. #ifndef PM4_MES_SET_RESOURCES_DEFINED
  43. #define PM4_MES_SET_RESOURCES_DEFINED
  44. enum mes_set_resources_queue_type_enum {
  45. queue_type__mes_set_resources__kernel_interface_queue_kiq = 0,
  46. queue_type__mes_set_resources__hsa_interface_queue_hiq = 1,
  47. queue_type__mes_set_resources__hsa_debug_interface_queue = 4
  48. };
  49. struct pm4_mes_set_resources {
  50. union {
  51. union PM4_MES_TYPE_3_HEADER header; /* header */
  52. uint32_t ordinal1;
  53. };
  54. union {
  55. struct {
  56. uint32_t vmid_mask:16;
  57. uint32_t unmap_latency:8;
  58. uint32_t reserved1:5;
  59. enum mes_set_resources_queue_type_enum queue_type:3;
  60. } bitfields2;
  61. uint32_t ordinal2;
  62. };
  63. uint32_t queue_mask_lo;
  64. uint32_t queue_mask_hi;
  65. uint32_t gws_mask_lo;
  66. uint32_t gws_mask_hi;
  67. union {
  68. struct {
  69. uint32_t oac_mask:16;
  70. uint32_t reserved2:16;
  71. } bitfields7;
  72. uint32_t ordinal7;
  73. };
  74. union {
  75. struct {
  76. uint32_t gds_heap_base:6;
  77. uint32_t reserved3:5;
  78. uint32_t gds_heap_size:6;
  79. uint32_t reserved4:15;
  80. } bitfields8;
  81. uint32_t ordinal8;
  82. };
  83. };
  84. #endif
  85. /*--------------------MES_RUN_LIST--------------------*/
  86. #ifndef PM4_MES_RUN_LIST_DEFINED
  87. #define PM4_MES_RUN_LIST_DEFINED
  88. struct pm4_mes_runlist {
  89. union {
  90. union PM4_MES_TYPE_3_HEADER header; /* header */
  91. uint32_t ordinal1;
  92. };
  93. union {
  94. struct {
  95. uint32_t reserved1:2;
  96. uint32_t ib_base_lo:30;
  97. } bitfields2;
  98. uint32_t ordinal2;
  99. };
  100. uint32_t ib_base_hi;
  101. union {
  102. struct {
  103. uint32_t ib_size:20;
  104. uint32_t chain:1;
  105. uint32_t offload_polling:1;
  106. uint32_t reserved2:1;
  107. uint32_t valid:1;
  108. uint32_t process_cnt:4;
  109. uint32_t reserved3:4;
  110. } bitfields4;
  111. uint32_t ordinal4;
  112. };
  113. };
  114. #endif
  115. /*--------------------MES_MAP_PROCESS--------------------*/
  116. #ifndef PM4_MES_MAP_PROCESS_DEFINED
  117. #define PM4_MES_MAP_PROCESS_DEFINED
  118. struct pm4_mes_map_process {
  119. union {
  120. union PM4_MES_TYPE_3_HEADER header; /* header */
  121. uint32_t ordinal1;
  122. };
  123. union {
  124. struct {
  125. uint32_t pasid:16;
  126. uint32_t reserved1:8;
  127. uint32_t diq_enable:1;
  128. uint32_t process_quantum:7;
  129. } bitfields2;
  130. uint32_t ordinal2;
  131. };
  132. uint32_t vm_context_page_table_base_addr_lo32;
  133. uint32_t vm_context_page_table_base_addr_hi32;
  134. uint32_t sh_mem_bases;
  135. uint32_t sh_mem_config;
  136. uint32_t sq_shader_tba_lo;
  137. uint32_t sq_shader_tba_hi;
  138. uint32_t sq_shader_tma_lo;
  139. uint32_t sq_shader_tma_hi;
  140. uint32_t reserved6;
  141. uint32_t gds_addr_lo;
  142. uint32_t gds_addr_hi;
  143. union {
  144. struct {
  145. uint32_t num_gws:6;
  146. uint32_t reserved7:1;
  147. uint32_t sdma_enable:1;
  148. uint32_t num_oac:4;
  149. uint32_t reserved8:4;
  150. uint32_t gds_size:6;
  151. uint32_t num_queues:10;
  152. } bitfields14;
  153. uint32_t ordinal14;
  154. };
  155. uint32_t completion_signal_lo;
  156. uint32_t completion_signal_hi;
  157. };
  158. #endif
  159. /*--------------------MES_MAP_PROCESS_VM--------------------*/
  160. #ifndef PM4_MES_MAP_PROCESS_VM_DEFINED
  161. #define PM4_MES_MAP_PROCESS_VM_DEFINED
  162. struct PM4_MES_MAP_PROCESS_VM {
  163. union {
  164. union PM4_MES_TYPE_3_HEADER header; /* header */
  165. uint32_t ordinal1;
  166. };
  167. uint32_t reserved1;
  168. uint32_t vm_context_cntl;
  169. uint32_t reserved2;
  170. uint32_t vm_context_page_table_end_addr_lo32;
  171. uint32_t vm_context_page_table_end_addr_hi32;
  172. uint32_t vm_context_page_table_start_addr_lo32;
  173. uint32_t vm_context_page_table_start_addr_hi32;
  174. uint32_t reserved3;
  175. uint32_t reserved4;
  176. uint32_t reserved5;
  177. uint32_t reserved6;
  178. uint32_t reserved7;
  179. uint32_t reserved8;
  180. uint32_t completion_signal_lo32;
  181. uint32_t completion_signal_hi32;
  182. };
  183. #endif
  184. /*--------------------MES_MAP_QUEUES--------------------*/
  185. #ifndef PM4_MES_MAP_QUEUES_VI_DEFINED
  186. #define PM4_MES_MAP_QUEUES_VI_DEFINED
  187. enum mes_map_queues_queue_sel_enum {
  188. queue_sel__mes_map_queues__map_to_specified_queue_slots_vi = 0,
  189. queue_sel__mes_map_queues__map_to_hws_determined_queue_slots_vi = 1
  190. };
  191. enum mes_map_queues_queue_type_enum {
  192. queue_type__mes_map_queues__normal_compute_vi = 0,
  193. queue_type__mes_map_queues__debug_interface_queue_vi = 1,
  194. queue_type__mes_map_queues__normal_latency_static_queue_vi = 2,
  195. queue_type__mes_map_queues__low_latency_static_queue_vi = 3
  196. };
  197. enum mes_map_queues_alloc_format_enum {
  198. alloc_format__mes_map_queues__one_per_pipe_vi = 0,
  199. alloc_format__mes_map_queues__all_on_one_pipe_vi = 1
  200. };
  201. enum mes_map_queues_engine_sel_enum {
  202. engine_sel__mes_map_queues__compute_vi = 0,
  203. engine_sel__mes_map_queues__sdma0_vi = 2,
  204. engine_sel__mes_map_queues__sdma1_vi = 3
  205. };
  206. struct pm4_mes_map_queues {
  207. union {
  208. union PM4_MES_TYPE_3_HEADER header; /* header */
  209. uint32_t ordinal1;
  210. };
  211. union {
  212. struct {
  213. uint32_t reserved1:4;
  214. enum mes_map_queues_queue_sel_enum queue_sel:2;
  215. uint32_t reserved2:15;
  216. enum mes_map_queues_queue_type_enum queue_type:3;
  217. enum mes_map_queues_alloc_format_enum alloc_format:2;
  218. enum mes_map_queues_engine_sel_enum engine_sel:3;
  219. uint32_t num_queues:3;
  220. } bitfields2;
  221. uint32_t ordinal2;
  222. };
  223. union {
  224. struct {
  225. uint32_t reserved3:1;
  226. uint32_t check_disable:1;
  227. uint32_t doorbell_offset:26;
  228. uint32_t reserved4:4;
  229. } bitfields3;
  230. uint32_t ordinal3;
  231. };
  232. uint32_t mqd_addr_lo;
  233. uint32_t mqd_addr_hi;
  234. uint32_t wptr_addr_lo;
  235. uint32_t wptr_addr_hi;
  236. };
  237. #endif
  238. /*--------------------MES_QUERY_STATUS--------------------*/
  239. #ifndef PM4_MES_QUERY_STATUS_DEFINED
  240. #define PM4_MES_QUERY_STATUS_DEFINED
  241. enum mes_query_status_interrupt_sel_enum {
  242. interrupt_sel__mes_query_status__completion_status = 0,
  243. interrupt_sel__mes_query_status__process_status = 1,
  244. interrupt_sel__mes_query_status__queue_status = 2
  245. };
  246. enum mes_query_status_command_enum {
  247. command__mes_query_status__interrupt_only = 0,
  248. command__mes_query_status__fence_only_immediate = 1,
  249. command__mes_query_status__fence_only_after_write_ack = 2,
  250. command__mes_query_status__fence_wait_for_write_ack_send_interrupt = 3
  251. };
  252. enum mes_query_status_engine_sel_enum {
  253. engine_sel__mes_query_status__compute = 0,
  254. engine_sel__mes_query_status__sdma0_queue = 2,
  255. engine_sel__mes_query_status__sdma1_queue = 3
  256. };
  257. struct pm4_mes_query_status {
  258. union {
  259. union PM4_MES_TYPE_3_HEADER header; /* header */
  260. uint32_t ordinal1;
  261. };
  262. union {
  263. struct {
  264. uint32_t context_id:28;
  265. enum mes_query_status_interrupt_sel_enum interrupt_sel:2;
  266. enum mes_query_status_command_enum command:2;
  267. } bitfields2;
  268. uint32_t ordinal2;
  269. };
  270. union {
  271. struct {
  272. uint32_t pasid:16;
  273. uint32_t reserved1:16;
  274. } bitfields3a;
  275. struct {
  276. uint32_t reserved2:2;
  277. uint32_t doorbell_offset:26;
  278. enum mes_query_status_engine_sel_enum engine_sel:3;
  279. uint32_t reserved3:1;
  280. } bitfields3b;
  281. uint32_t ordinal3;
  282. };
  283. uint32_t addr_lo;
  284. uint32_t addr_hi;
  285. uint32_t data_lo;
  286. uint32_t data_hi;
  287. };
  288. #endif
  289. /*--------------------MES_UNMAP_QUEUES--------------------*/
  290. #ifndef PM4_MES_UNMAP_QUEUES_DEFINED
  291. #define PM4_MES_UNMAP_QUEUES_DEFINED
  292. enum mes_unmap_queues_action_enum {
  293. action__mes_unmap_queues__preempt_queues = 0,
  294. action__mes_unmap_queues__reset_queues = 1,
  295. action__mes_unmap_queues__disable_process_queues = 2,
  296. action__mes_unmap_queues__reserved = 3
  297. };
  298. enum mes_unmap_queues_queue_sel_enum {
  299. queue_sel__mes_unmap_queues__perform_request_on_specified_queues = 0,
  300. queue_sel__mes_unmap_queues__perform_request_on_pasid_queues = 1,
  301. queue_sel__mes_unmap_queues__unmap_all_queues = 2,
  302. queue_sel__mes_unmap_queues__unmap_all_non_static_queues = 3
  303. };
  304. enum mes_unmap_queues_engine_sel_enum {
  305. engine_sel__mes_unmap_queues__compute = 0,
  306. engine_sel__mes_unmap_queues__sdma0 = 2,
  307. engine_sel__mes_unmap_queues__sdmal = 3
  308. };
  309. struct pm4_mes_unmap_queues {
  310. union {
  311. union PM4_MES_TYPE_3_HEADER header; /* header */
  312. uint32_t ordinal1;
  313. };
  314. union {
  315. struct {
  316. enum mes_unmap_queues_action_enum action:2;
  317. uint32_t reserved1:2;
  318. enum mes_unmap_queues_queue_sel_enum queue_sel:2;
  319. uint32_t reserved2:20;
  320. enum mes_unmap_queues_engine_sel_enum engine_sel:3;
  321. uint32_t num_queues:3;
  322. } bitfields2;
  323. uint32_t ordinal2;
  324. };
  325. union {
  326. struct {
  327. uint32_t pasid:16;
  328. uint32_t reserved3:16;
  329. } bitfields3a;
  330. struct {
  331. uint32_t reserved4:2;
  332. uint32_t doorbell_offset0:26;
  333. int32_t reserved5:4;
  334. } bitfields3b;
  335. uint32_t ordinal3;
  336. };
  337. union {
  338. struct {
  339. uint32_t reserved6:2;
  340. uint32_t doorbell_offset1:26;
  341. uint32_t reserved7:4;
  342. } bitfields4;
  343. uint32_t ordinal4;
  344. };
  345. union {
  346. struct {
  347. uint32_t reserved8:2;
  348. uint32_t doorbell_offset2:26;
  349. uint32_t reserved9:4;
  350. } bitfields5;
  351. uint32_t ordinal5;
  352. };
  353. union {
  354. struct {
  355. uint32_t reserved10:2;
  356. uint32_t doorbell_offset3:26;
  357. uint32_t reserved11:4;
  358. } bitfields6;
  359. uint32_t ordinal6;
  360. };
  361. };
  362. #endif
  363. #ifndef PM4_MEC_RELEASE_MEM_DEFINED
  364. #define PM4_MEC_RELEASE_MEM_DEFINED
  365. enum mec_release_mem_event_index_enum {
  366. event_index__mec_release_mem__end_of_pipe = 5,
  367. event_index__mec_release_mem__shader_done = 6
  368. };
  369. enum mec_release_mem_cache_policy_enum {
  370. cache_policy__mec_release_mem__lru = 0,
  371. cache_policy__mec_release_mem__stream = 1
  372. };
  373. enum mec_release_mem_pq_exe_status_enum {
  374. pq_exe_status__mec_release_mem__default = 0,
  375. pq_exe_status__mec_release_mem__phase_update = 1
  376. };
  377. enum mec_release_mem_dst_sel_enum {
  378. dst_sel__mec_release_mem__memory_controller = 0,
  379. dst_sel__mec_release_mem__tc_l2 = 1,
  380. dst_sel__mec_release_mem__queue_write_pointer_register = 2,
  381. dst_sel__mec_release_mem__queue_write_pointer_poll_mask_bit = 3
  382. };
  383. enum mec_release_mem_int_sel_enum {
  384. int_sel__mec_release_mem__none = 0,
  385. int_sel__mec_release_mem__send_interrupt_only = 1,
  386. int_sel__mec_release_mem__send_interrupt_after_write_confirm = 2,
  387. int_sel__mec_release_mem__send_data_after_write_confirm = 3,
  388. int_sel__mec_release_mem__unconditionally_send_int_ctxid = 4,
  389. int_sel__mec_release_mem__conditionally_send_int_ctxid_based_on_32_bit_compare = 5,
  390. int_sel__mec_release_mem__conditionally_send_int_ctxid_based_on_64_bit_compare = 6
  391. };
  392. enum mec_release_mem_data_sel_enum {
  393. data_sel__mec_release_mem__none = 0,
  394. data_sel__mec_release_mem__send_32_bit_low = 1,
  395. data_sel__mec_release_mem__send_64_bit_data = 2,
  396. data_sel__mec_release_mem__send_gpu_clock_counter = 3,
  397. data_sel__mec_release_mem__send_cp_perfcounter_hi_lo = 4,
  398. data_sel__mec_release_mem__store_gds_data_to_memory = 5
  399. };
  400. struct pm4_mec_release_mem {
  401. union {
  402. union PM4_MES_TYPE_3_HEADER header; /*header */
  403. unsigned int ordinal1;
  404. };
  405. union {
  406. struct {
  407. unsigned int event_type:6;
  408. unsigned int reserved1:2;
  409. enum mec_release_mem_event_index_enum event_index:4;
  410. unsigned int tcl1_vol_action_ena:1;
  411. unsigned int tc_vol_action_ena:1;
  412. unsigned int reserved2:1;
  413. unsigned int tc_wb_action_ena:1;
  414. unsigned int tcl1_action_ena:1;
  415. unsigned int tc_action_ena:1;
  416. uint32_t reserved3:1;
  417. uint32_t tc_nc_action_ena:1;
  418. uint32_t tc_wc_action_ena:1;
  419. uint32_t tc_md_action_ena:1;
  420. uint32_t reserved4:3;
  421. enum mec_release_mem_cache_policy_enum cache_policy:2;
  422. uint32_t reserved5:2;
  423. enum mec_release_mem_pq_exe_status_enum pq_exe_status:1;
  424. uint32_t reserved6:2;
  425. } bitfields2;
  426. unsigned int ordinal2;
  427. };
  428. union {
  429. struct {
  430. uint32_t reserved7:16;
  431. enum mec_release_mem_dst_sel_enum dst_sel:2;
  432. uint32_t reserved8:6;
  433. enum mec_release_mem_int_sel_enum int_sel:3;
  434. uint32_t reserved9:2;
  435. enum mec_release_mem_data_sel_enum data_sel:3;
  436. } bitfields3;
  437. unsigned int ordinal3;
  438. };
  439. union {
  440. struct {
  441. uint32_t reserved10:2;
  442. unsigned int address_lo_32b:30;
  443. } bitfields4;
  444. struct {
  445. uint32_t reserved11:3;
  446. uint32_t address_lo_64b:29;
  447. } bitfields4b;
  448. uint32_t reserved12;
  449. unsigned int ordinal4;
  450. };
  451. union {
  452. uint32_t address_hi;
  453. uint32_t reserved13;
  454. uint32_t ordinal5;
  455. };
  456. union {
  457. uint32_t data_lo;
  458. uint32_t cmp_data_lo;
  459. struct {
  460. uint32_t dw_offset:16;
  461. uint32_t num_dwords:16;
  462. } bitfields6c;
  463. uint32_t reserved14;
  464. uint32_t ordinal6;
  465. };
  466. union {
  467. uint32_t data_hi;
  468. uint32_t cmp_data_hi;
  469. uint32_t reserved15;
  470. uint32_t reserved16;
  471. uint32_t ordinal7;
  472. };
  473. uint32_t int_ctxid;
  474. };
  475. #endif
  476. enum {
  477. CACHE_FLUSH_AND_INV_TS_EVENT = 0x00000014
  478. };
  479. #endif