amdgpu_virt.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440
  1. /*
  2. * Copyright 2016 Advanced Micro Devices, Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. */
  23. #include "amdgpu.h"
  24. #define MAX_KIQ_REG_WAIT 5000 /* in usecs, 5ms */
  25. #define MAX_KIQ_REG_BAILOUT_INTERVAL 5 /* in msecs, 5ms */
  26. #define MAX_KIQ_REG_TRY 20
  27. uint64_t amdgpu_csa_vaddr(struct amdgpu_device *adev)
  28. {
  29. uint64_t addr = adev->vm_manager.max_pfn << AMDGPU_GPU_PAGE_SHIFT;
  30. addr -= AMDGPU_VA_RESERVED_SIZE;
  31. if (addr >= AMDGPU_VA_HOLE_START)
  32. addr |= AMDGPU_VA_HOLE_END;
  33. return addr;
  34. }
  35. bool amdgpu_virt_mmio_blocked(struct amdgpu_device *adev)
  36. {
  37. /* By now all MMIO pages except mailbox are blocked */
  38. /* if blocking is enabled in hypervisor. Choose the */
  39. /* SCRATCH_REG0 to test. */
  40. return RREG32_NO_KIQ(0xc040) == 0xffffffff;
  41. }
  42. int amdgpu_allocate_static_csa(struct amdgpu_device *adev)
  43. {
  44. int r;
  45. void *ptr;
  46. r = amdgpu_bo_create_kernel(adev, AMDGPU_CSA_SIZE, PAGE_SIZE,
  47. AMDGPU_GEM_DOMAIN_VRAM, &adev->virt.csa_obj,
  48. &adev->virt.csa_vmid0_addr, &ptr);
  49. if (r)
  50. return r;
  51. memset(ptr, 0, AMDGPU_CSA_SIZE);
  52. return 0;
  53. }
  54. void amdgpu_free_static_csa(struct amdgpu_device *adev) {
  55. amdgpu_bo_free_kernel(&adev->virt.csa_obj,
  56. &adev->virt.csa_vmid0_addr,
  57. NULL);
  58. }
  59. /*
  60. * amdgpu_map_static_csa should be called during amdgpu_vm_init
  61. * it maps virtual address amdgpu_csa_vaddr() to this VM, and each command
  62. * submission of GFX should use this virtual address within META_DATA init
  63. * package to support SRIOV gfx preemption.
  64. */
  65. int amdgpu_map_static_csa(struct amdgpu_device *adev, struct amdgpu_vm *vm,
  66. struct amdgpu_bo_va **bo_va)
  67. {
  68. uint64_t csa_addr = amdgpu_csa_vaddr(adev) & AMDGPU_VA_HOLE_MASK;
  69. struct ww_acquire_ctx ticket;
  70. struct list_head list;
  71. struct amdgpu_bo_list_entry pd;
  72. struct ttm_validate_buffer csa_tv;
  73. int r;
  74. INIT_LIST_HEAD(&list);
  75. INIT_LIST_HEAD(&csa_tv.head);
  76. csa_tv.bo = &adev->virt.csa_obj->tbo;
  77. csa_tv.shared = true;
  78. list_add(&csa_tv.head, &list);
  79. amdgpu_vm_get_pd_bo(vm, &list, &pd);
  80. r = ttm_eu_reserve_buffers(&ticket, &list, true, NULL);
  81. if (r) {
  82. DRM_ERROR("failed to reserve CSA,PD BOs: err=%d\n", r);
  83. return r;
  84. }
  85. *bo_va = amdgpu_vm_bo_add(adev, vm, adev->virt.csa_obj);
  86. if (!*bo_va) {
  87. ttm_eu_backoff_reservation(&ticket, &list);
  88. DRM_ERROR("failed to create bo_va for static CSA\n");
  89. return -ENOMEM;
  90. }
  91. r = amdgpu_vm_alloc_pts(adev, (*bo_va)->base.vm, csa_addr,
  92. AMDGPU_CSA_SIZE);
  93. if (r) {
  94. DRM_ERROR("failed to allocate pts for static CSA, err=%d\n", r);
  95. amdgpu_vm_bo_rmv(adev, *bo_va);
  96. ttm_eu_backoff_reservation(&ticket, &list);
  97. return r;
  98. }
  99. r = amdgpu_vm_bo_map(adev, *bo_va, csa_addr, 0, AMDGPU_CSA_SIZE,
  100. AMDGPU_PTE_READABLE | AMDGPU_PTE_WRITEABLE |
  101. AMDGPU_PTE_EXECUTABLE);
  102. if (r) {
  103. DRM_ERROR("failed to do bo_map on static CSA, err=%d\n", r);
  104. amdgpu_vm_bo_rmv(adev, *bo_va);
  105. ttm_eu_backoff_reservation(&ticket, &list);
  106. return r;
  107. }
  108. ttm_eu_backoff_reservation(&ticket, &list);
  109. return 0;
  110. }
  111. void amdgpu_virt_init_setting(struct amdgpu_device *adev)
  112. {
  113. /* enable virtual display */
  114. adev->mode_info.num_crtc = 1;
  115. adev->enable_virtual_display = true;
  116. adev->cg_flags = 0;
  117. adev->pg_flags = 0;
  118. }
  119. uint32_t amdgpu_virt_kiq_rreg(struct amdgpu_device *adev, uint32_t reg)
  120. {
  121. signed long r, cnt = 0;
  122. unsigned long flags;
  123. uint32_t seq;
  124. struct amdgpu_kiq *kiq = &adev->gfx.kiq;
  125. struct amdgpu_ring *ring = &kiq->ring;
  126. BUG_ON(!ring->funcs->emit_rreg);
  127. spin_lock_irqsave(&kiq->ring_lock, flags);
  128. amdgpu_ring_alloc(ring, 32);
  129. amdgpu_ring_emit_rreg(ring, reg);
  130. amdgpu_fence_emit_polling(ring, &seq);
  131. amdgpu_ring_commit(ring);
  132. spin_unlock_irqrestore(&kiq->ring_lock, flags);
  133. r = amdgpu_fence_wait_polling(ring, seq, MAX_KIQ_REG_WAIT);
  134. /* don't wait anymore for gpu reset case because this way may
  135. * block gpu_recover() routine forever, e.g. this virt_kiq_rreg
  136. * is triggered in TTM and ttm_bo_lock_delayed_workqueue() will
  137. * never return if we keep waiting in virt_kiq_rreg, which cause
  138. * gpu_recover() hang there.
  139. *
  140. * also don't wait anymore for IRQ context
  141. * */
  142. if (r < 1 && (adev->in_gpu_reset || in_interrupt()))
  143. goto failed_kiq_read;
  144. if (in_interrupt())
  145. might_sleep();
  146. while (r < 1 && cnt++ < MAX_KIQ_REG_TRY) {
  147. msleep(MAX_KIQ_REG_BAILOUT_INTERVAL);
  148. r = amdgpu_fence_wait_polling(ring, seq, MAX_KIQ_REG_WAIT);
  149. }
  150. if (cnt > MAX_KIQ_REG_TRY)
  151. goto failed_kiq_read;
  152. return adev->wb.wb[adev->virt.reg_val_offs];
  153. failed_kiq_read:
  154. pr_err("failed to read reg:%x\n", reg);
  155. return ~0;
  156. }
  157. void amdgpu_virt_kiq_wreg(struct amdgpu_device *adev, uint32_t reg, uint32_t v)
  158. {
  159. signed long r, cnt = 0;
  160. unsigned long flags;
  161. uint32_t seq;
  162. struct amdgpu_kiq *kiq = &adev->gfx.kiq;
  163. struct amdgpu_ring *ring = &kiq->ring;
  164. BUG_ON(!ring->funcs->emit_wreg);
  165. spin_lock_irqsave(&kiq->ring_lock, flags);
  166. amdgpu_ring_alloc(ring, 32);
  167. amdgpu_ring_emit_wreg(ring, reg, v);
  168. amdgpu_fence_emit_polling(ring, &seq);
  169. amdgpu_ring_commit(ring);
  170. spin_unlock_irqrestore(&kiq->ring_lock, flags);
  171. r = amdgpu_fence_wait_polling(ring, seq, MAX_KIQ_REG_WAIT);
  172. /* don't wait anymore for gpu reset case because this way may
  173. * block gpu_recover() routine forever, e.g. this virt_kiq_rreg
  174. * is triggered in TTM and ttm_bo_lock_delayed_workqueue() will
  175. * never return if we keep waiting in virt_kiq_rreg, which cause
  176. * gpu_recover() hang there.
  177. *
  178. * also don't wait anymore for IRQ context
  179. * */
  180. if (r < 1 && (adev->in_gpu_reset || in_interrupt()))
  181. goto failed_kiq_write;
  182. if (in_interrupt())
  183. might_sleep();
  184. while (r < 1 && cnt++ < MAX_KIQ_REG_TRY) {
  185. msleep(MAX_KIQ_REG_BAILOUT_INTERVAL);
  186. r = amdgpu_fence_wait_polling(ring, seq, MAX_KIQ_REG_WAIT);
  187. }
  188. if (cnt > MAX_KIQ_REG_TRY)
  189. goto failed_kiq_write;
  190. return;
  191. failed_kiq_write:
  192. pr_err("failed to write reg:%x\n", reg);
  193. }
  194. /**
  195. * amdgpu_virt_request_full_gpu() - request full gpu access
  196. * @amdgpu: amdgpu device.
  197. * @init: is driver init time.
  198. * When start to init/fini driver, first need to request full gpu access.
  199. * Return: Zero if request success, otherwise will return error.
  200. */
  201. int amdgpu_virt_request_full_gpu(struct amdgpu_device *adev, bool init)
  202. {
  203. struct amdgpu_virt *virt = &adev->virt;
  204. int r;
  205. if (virt->ops && virt->ops->req_full_gpu) {
  206. r = virt->ops->req_full_gpu(adev, init);
  207. if (r)
  208. return r;
  209. adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
  210. }
  211. return 0;
  212. }
  213. /**
  214. * amdgpu_virt_release_full_gpu() - release full gpu access
  215. * @amdgpu: amdgpu device.
  216. * @init: is driver init time.
  217. * When finishing driver init/fini, need to release full gpu access.
  218. * Return: Zero if release success, otherwise will returen error.
  219. */
  220. int amdgpu_virt_release_full_gpu(struct amdgpu_device *adev, bool init)
  221. {
  222. struct amdgpu_virt *virt = &adev->virt;
  223. int r;
  224. if (virt->ops && virt->ops->rel_full_gpu) {
  225. r = virt->ops->rel_full_gpu(adev, init);
  226. if (r)
  227. return r;
  228. adev->virt.caps |= AMDGPU_SRIOV_CAPS_RUNTIME;
  229. }
  230. return 0;
  231. }
  232. /**
  233. * amdgpu_virt_reset_gpu() - reset gpu
  234. * @amdgpu: amdgpu device.
  235. * Send reset command to GPU hypervisor to reset GPU that VM is using
  236. * Return: Zero if reset success, otherwise will return error.
  237. */
  238. int amdgpu_virt_reset_gpu(struct amdgpu_device *adev)
  239. {
  240. struct amdgpu_virt *virt = &adev->virt;
  241. int r;
  242. if (virt->ops && virt->ops->reset_gpu) {
  243. r = virt->ops->reset_gpu(adev);
  244. if (r)
  245. return r;
  246. adev->virt.caps &= ~AMDGPU_SRIOV_CAPS_RUNTIME;
  247. }
  248. return 0;
  249. }
  250. /**
  251. * amdgpu_virt_wait_reset() - wait for reset gpu completed
  252. * @amdgpu: amdgpu device.
  253. * Wait for GPU reset completed.
  254. * Return: Zero if reset success, otherwise will return error.
  255. */
  256. int amdgpu_virt_wait_reset(struct amdgpu_device *adev)
  257. {
  258. struct amdgpu_virt *virt = &adev->virt;
  259. if (!virt->ops || !virt->ops->wait_reset)
  260. return -EINVAL;
  261. return virt->ops->wait_reset(adev);
  262. }
  263. /**
  264. * amdgpu_virt_alloc_mm_table() - alloc memory for mm table
  265. * @amdgpu: amdgpu device.
  266. * MM table is used by UVD and VCE for its initialization
  267. * Return: Zero if allocate success.
  268. */
  269. int amdgpu_virt_alloc_mm_table(struct amdgpu_device *adev)
  270. {
  271. int r;
  272. if (!amdgpu_sriov_vf(adev) || adev->virt.mm_table.gpu_addr)
  273. return 0;
  274. r = amdgpu_bo_create_kernel(adev, PAGE_SIZE, PAGE_SIZE,
  275. AMDGPU_GEM_DOMAIN_VRAM,
  276. &adev->virt.mm_table.bo,
  277. &adev->virt.mm_table.gpu_addr,
  278. (void *)&adev->virt.mm_table.cpu_addr);
  279. if (r) {
  280. DRM_ERROR("failed to alloc mm table and error = %d.\n", r);
  281. return r;
  282. }
  283. memset((void *)adev->virt.mm_table.cpu_addr, 0, PAGE_SIZE);
  284. DRM_INFO("MM table gpu addr = 0x%llx, cpu addr = %p.\n",
  285. adev->virt.mm_table.gpu_addr,
  286. adev->virt.mm_table.cpu_addr);
  287. return 0;
  288. }
  289. /**
  290. * amdgpu_virt_free_mm_table() - free mm table memory
  291. * @amdgpu: amdgpu device.
  292. * Free MM table memory
  293. */
  294. void amdgpu_virt_free_mm_table(struct amdgpu_device *adev)
  295. {
  296. if (!amdgpu_sriov_vf(adev) || !adev->virt.mm_table.gpu_addr)
  297. return;
  298. amdgpu_bo_free_kernel(&adev->virt.mm_table.bo,
  299. &adev->virt.mm_table.gpu_addr,
  300. (void *)&adev->virt.mm_table.cpu_addr);
  301. adev->virt.mm_table.gpu_addr = 0;
  302. }
  303. int amdgpu_virt_fw_reserve_get_checksum(void *obj,
  304. unsigned long obj_size,
  305. unsigned int key,
  306. unsigned int chksum)
  307. {
  308. unsigned int ret = key;
  309. unsigned long i = 0;
  310. unsigned char *pos;
  311. pos = (char *)obj;
  312. /* calculate checksum */
  313. for (i = 0; i < obj_size; ++i)
  314. ret += *(pos + i);
  315. /* minus the chksum itself */
  316. pos = (char *)&chksum;
  317. for (i = 0; i < sizeof(chksum); ++i)
  318. ret -= *(pos + i);
  319. return ret;
  320. }
  321. void amdgpu_virt_init_data_exchange(struct amdgpu_device *adev)
  322. {
  323. uint32_t pf2vf_size = 0;
  324. uint32_t checksum = 0;
  325. uint32_t checkval;
  326. char *str;
  327. adev->virt.fw_reserve.p_pf2vf = NULL;
  328. adev->virt.fw_reserve.p_vf2pf = NULL;
  329. if (adev->fw_vram_usage.va != NULL) {
  330. adev->virt.fw_reserve.p_pf2vf =
  331. (struct amdgim_pf2vf_info_header *)(
  332. adev->fw_vram_usage.va + AMDGIM_DATAEXCHANGE_OFFSET);
  333. AMDGPU_FW_VRAM_PF2VF_READ(adev, header.size, &pf2vf_size);
  334. AMDGPU_FW_VRAM_PF2VF_READ(adev, checksum, &checksum);
  335. AMDGPU_FW_VRAM_PF2VF_READ(adev, feature_flags, &adev->virt.gim_feature);
  336. /* pf2vf message must be in 4K */
  337. if (pf2vf_size > 0 && pf2vf_size < 4096) {
  338. checkval = amdgpu_virt_fw_reserve_get_checksum(
  339. adev->virt.fw_reserve.p_pf2vf, pf2vf_size,
  340. adev->virt.fw_reserve.checksum_key, checksum);
  341. if (checkval == checksum) {
  342. adev->virt.fw_reserve.p_vf2pf =
  343. ((void *)adev->virt.fw_reserve.p_pf2vf +
  344. pf2vf_size);
  345. memset((void *)adev->virt.fw_reserve.p_vf2pf, 0,
  346. sizeof(amdgim_vf2pf_info));
  347. AMDGPU_FW_VRAM_VF2PF_WRITE(adev, header.version,
  348. AMDGPU_FW_VRAM_VF2PF_VER);
  349. AMDGPU_FW_VRAM_VF2PF_WRITE(adev, header.size,
  350. sizeof(amdgim_vf2pf_info));
  351. AMDGPU_FW_VRAM_VF2PF_READ(adev, driver_version,
  352. &str);
  353. #ifdef MODULE
  354. if (THIS_MODULE->version != NULL)
  355. strcpy(str, THIS_MODULE->version);
  356. else
  357. #endif
  358. strcpy(str, "N/A");
  359. AMDGPU_FW_VRAM_VF2PF_WRITE(adev, driver_cert,
  360. 0);
  361. AMDGPU_FW_VRAM_VF2PF_WRITE(adev, checksum,
  362. amdgpu_virt_fw_reserve_get_checksum(
  363. adev->virt.fw_reserve.p_vf2pf,
  364. pf2vf_size,
  365. adev->virt.fw_reserve.checksum_key, 0));
  366. }
  367. }
  368. }
  369. }