1 | /* |
2 | * Copyright 2010 Advanced Micro Devices, Inc. |
3 | * |
4 | * Permission is hereby granted, free of charge, to any person obtaining a |
5 | * copy of this software and associated documentation files (the "Software"), |
6 | * to deal in the Software without restriction, including without limitation |
7 | * the rights to use, copy, modify, merge, publish, distribute, sublicense, |
8 | * and/or sell copies of the Software, and to permit persons to whom the |
9 | * Software is furnished to do so, subject to the following conditions: |
10 | * |
11 | * The above copyright notice and this permission notice shall be included in |
12 | * all copies or substantial portions of the Software. |
13 | * |
14 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
15 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
16 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
17 | * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR |
18 | * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, |
19 | * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR |
20 | * OTHER DEALINGS IN THE SOFTWARE. |
21 | * |
22 | * Authors: Alex Deucher |
23 | */ |
24 | |
25 | #include "radeon.h" |
26 | #include "radeon_asic.h" |
27 | #include "evergreen.h" |
28 | #include "evergreend.h" |
29 | |
30 | /** |
31 | * evergreen_dma_fence_ring_emit - emit a fence on the DMA ring |
32 | * |
33 | * @rdev: radeon_device pointer |
34 | * @fence: radeon fence object |
35 | * |
36 | * Add a DMA fence packet to the ring to write |
37 | * the fence seq number and DMA trap packet to generate |
38 | * an interrupt if needed (evergreen-SI). |
39 | */ |
40 | void evergreen_dma_fence_ring_emit(struct radeon_device *rdev, |
41 | struct radeon_fence *fence) |
42 | { |
43 | struct radeon_ring *ring = &rdev->ring[fence->ring]; |
44 | u64 addr = rdev->fence_drv[fence->ring].gpu_addr; |
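	/* the fence address is a 40 bit MC address: the low 32 bits must be
	 * dword aligned, the top 8 bits are carried in a separate ring dword
	 */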
45 | /* write the fence */ |
46 | radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_FENCE, 0, 0)); |
	radeon_ring_write(ring, addr & 0xfffffffc);
	radeon_ring_write(ring, upper_32_bits(addr) & 0xff);
	radeon_ring_write(ring, fence->seq);
50 | /* generate an interrupt */ |
51 | radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_TRAP, 0, 0)); |
	/* flush HDP so the fence write is visible to the CPU */
53 | radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_SRBM_WRITE, 0, 0)); |
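	/* SRBM_WRITE payload: byte enables in bits 19:16, dword register
	 * offset in the low bits, hence the >> 2
	 */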
	radeon_ring_write(ring, (0xf << 16) | (HDP_MEM_COHERENCY_FLUSH_CNTL >> 2));
	radeon_ring_write(ring, 1);
56 | } |
57 | |
58 | /** |
59 | * evergreen_dma_ring_ib_execute - schedule an IB on the DMA engine |
60 | * |
61 | * @rdev: radeon_device pointer |
62 | * @ib: IB object to schedule |
63 | * |
64 | * Schedule an IB in the DMA ring (evergreen). |
65 | */ |
66 | void evergreen_dma_ring_ib_execute(struct radeon_device *rdev, |
67 | struct radeon_ib *ib) |
68 | { |
69 | struct radeon_ring *ring = &rdev->ring[ib->ring]; |
70 | |
71 | if (rdev->wb.enabled) { |
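		/* compute where the ring rptr will be once the INDIRECT_BUFFER
		 * packet below has been fetched: skip the 4 DW WRITE packet,
		 * the NOP padding up to DW 5 of an 8 DW group, then the
		 * 3 DW IB packet itself
		 */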
72 | u32 next_rptr = ring->wptr + 4; |
73 | while ((next_rptr & 7) != 5) |
74 | next_rptr++; |
75 | next_rptr += 3; |
76 | radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_WRITE, 0, 1)); |
		radeon_ring_write(ring, ring->next_rptr_gpu_addr & 0xfffffffc);
		radeon_ring_write(ring, upper_32_bits(ring->next_rptr_gpu_addr) & 0xff);
		radeon_ring_write(ring, next_rptr);
80 | } |
81 | |
	/* The indirect buffer packet must end on an 8 DW boundary in the
	 * DMA ring: the packet is 3 DW long, so it has to start at DW 5
	 * of an 8 DW group.  Pad with NOPs as necessary.
	 */
85 | while ((ring->wptr & 7) != 5) |
86 | radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_NOP, 0, 0)); |
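	/* IB packet: header, 32 byte aligned IB address, then the IB
	 * length in DWs (bits 31:12) and the upper 8 address bits
	 */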
87 | radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_INDIRECT_BUFFER, 0, 0)); |
	radeon_ring_write(ring, (ib->gpu_addr & 0xFFFFFFE0));
	radeon_ring_write(ring, (ib->length_dw << 12) | (upper_32_bits(ib->gpu_addr) & 0xFF));
91 | } |
92 | |
93 | /** |
94 | * evergreen_copy_dma - copy pages using the DMA engine |
95 | * |
96 | * @rdev: radeon_device pointer |
97 | * @src_offset: src GPU address |
98 | * @dst_offset: dst GPU address |
99 | * @num_gpu_pages: number of GPU pages to xfer |
100 | * @resv: reservation object with embedded fence |
101 | * |
 * Copy GPU pages using the DMA engine (evergreen-cayman).
103 | * Used by the radeon ttm implementation to move pages if |
104 | * registered as the asic copy callback. |
105 | */ |
106 | struct radeon_fence *evergreen_copy_dma(struct radeon_device *rdev, |
107 | uint64_t src_offset, |
108 | uint64_t dst_offset, |
109 | unsigned num_gpu_pages, |
110 | struct dma_resv *resv) |
111 | { |
112 | struct radeon_fence *fence; |
113 | struct radeon_sync sync; |
114 | int ring_index = rdev->asic->copy.dma_ring_index; |
115 | struct radeon_ring *ring = &rdev->ring[ring_index]; |
116 | u32 size_in_dw, cur_size_in_dw; |
117 | int i, num_loops; |
118 | int r = 0; |
119 | |
	radeon_sync_create(&sync);
121 | |
122 | size_in_dw = (num_gpu_pages << RADEON_GPU_PAGE_SHIFT) / 4; |
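	/* each DMA_PACKET_COPY can move at most 0xfffff dwords */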
123 | num_loops = DIV_ROUND_UP(size_in_dw, 0xfffff); |
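	/* 5 DW per copy packet, plus headroom for the sync and fence packets */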
	r = radeon_ring_lock(rdev, ring, num_loops * 5 + 11);
125 | if (r) { |
126 | DRM_ERROR("radeon: moving bo (%d).\n" , r); |
127 | radeon_sync_free(rdev, sync: &sync, NULL); |
128 | return ERR_PTR(error: r); |
129 | } |
130 | |
	radeon_sync_resv(rdev, &sync, resv, false);
	radeon_sync_rings(rdev, &sync, ring->idx);
133 | |
134 | for (i = 0; i < num_loops; i++) { |
135 | cur_size_in_dw = size_in_dw; |
136 | if (cur_size_in_dw > 0xFFFFF) |
137 | cur_size_in_dw = 0xFFFFF; |
138 | size_in_dw -= cur_size_in_dw; |
139 | radeon_ring_write(ring, DMA_PACKET(DMA_PACKET_COPY, 0, cur_size_in_dw)); |
		radeon_ring_write(ring, dst_offset & 0xfffffffc);
		radeon_ring_write(ring, src_offset & 0xfffffffc);
142 | radeon_ring_write(ring, upper_32_bits(dst_offset) & 0xff); |
143 | radeon_ring_write(ring, upper_32_bits(src_offset) & 0xff); |
144 | src_offset += cur_size_in_dw * 4; |
145 | dst_offset += cur_size_in_dw * 4; |
146 | } |
147 | |
	r = radeon_fence_emit(rdev, &fence, ring->idx);
149 | if (r) { |
		radeon_ring_unlock_undo(rdev, ring);
		radeon_sync_free(rdev, &sync, NULL);
		return ERR_PTR(r);
153 | } |
154 | |
	radeon_ring_unlock_commit(rdev, ring, false);
	radeon_sync_free(rdev, &sync, fence);
157 | |
158 | return fence; |
159 | } |
160 | |
161 | /** |
162 | * evergreen_dma_is_lockup - Check if the DMA engine is locked up |
163 | * |
164 | * @rdev: radeon_device pointer |
165 | * @ring: radeon_ring structure holding ring information |
166 | * |
167 | * Check if the async DMA engine is locked up. |
168 | * Returns true if the engine appears to be locked up, false if not. |
169 | */ |
170 | bool evergreen_dma_is_lockup(struct radeon_device *rdev, struct radeon_ring *ring) |
171 | { |
172 | u32 reset_mask = evergreen_gpu_check_soft_reset(rdev); |
173 | |
174 | if (!(reset_mask & RADEON_RESET_DMA)) { |
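		/* no DMA block reset is pending, so the engine is presumed
		 * alive; refresh the lockup tracking information
		 */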
175 | radeon_ring_lockup_update(rdev, ring); |
176 | return false; |
177 | } |
178 | return radeon_ring_test_lockup(rdev, ring); |
179 | } |