drm/etnaviv: move exec_state to submit object
[platform/kernel/linux-rpi.git] drivers/gpu/drm/etnaviv/etnaviv_buffer.c
/*
 * Copyright (C) 2014 Etnaviv Project
 * Author: Christian Gmeiner <christian.gmeiner@gmail.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 as published by
 * the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program.  If not, see <http://www.gnu.org/licenses/>.
 */

#include "etnaviv_cmdbuf.h"
#include "etnaviv_gpu.h"
#include "etnaviv_gem.h"
#include "etnaviv_mmu.h"

#include "common.xml.h"
#include "state.xml.h"
#include "state_hi.xml.h"
#include "state_3d.xml.h"
#include "cmdstream.xml.h"

/*
 * Command Buffer helper:
 */

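/*
 * Emit one 32-bit word into the command buffer and advance the software
 * write position (user_size) by four bytes.
 */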
static inline void OUT(struct etnaviv_cmdbuf *buffer, u32 data)
{
        u32 *vaddr = (u32 *)buffer->vaddr;

        BUG_ON(buffer->user_size >= buffer->size);

        vaddr[buffer->user_size / 4] = data;
        buffer->user_size += 4;
}

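/*
 * Emit a LOAD_STATE command that writes 'value' into the single state
 * register addressed by 'reg'.  Commands are aligned to 64-bit boundaries
 * before the header is written.
 */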
static inline void CMD_LOAD_STATE(struct etnaviv_cmdbuf *buffer,
        u32 reg, u32 value)
{
        u32 index = reg >> VIV_FE_LOAD_STATE_HEADER_OFFSET__SHR;

        buffer->user_size = ALIGN(buffer->user_size, 8);

        /* write a register via cmd stream */
        OUT(buffer, VIV_FE_LOAD_STATE_HEADER_OP_LOAD_STATE |
                    VIV_FE_LOAD_STATE_HEADER_COUNT(1) |
                    VIV_FE_LOAD_STATE_HEADER_OFFSET(index));
        OUT(buffer, value);
}

static inline void CMD_END(struct etnaviv_cmdbuf *buffer)
{
        buffer->user_size = ALIGN(buffer->user_size, 8);

        OUT(buffer, VIV_FE_END_HEADER_OP_END);
}

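/*
 * Emit a WAIT command: the front end idles for 200 cycles before fetching
 * the following command.  Paired with a LINK back to itself this forms the
 * busy-wait loop the FE spins in while the ring buffer is idle.
 */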
static inline void CMD_WAIT(struct etnaviv_cmdbuf *buffer)
{
        buffer->user_size = ALIGN(buffer->user_size, 8);

        OUT(buffer, VIV_FE_WAIT_HEADER_OP_WAIT | 200);
}

static inline void CMD_LINK(struct etnaviv_cmdbuf *buffer,
        u16 prefetch, u32 address)
{
        buffer->user_size = ALIGN(buffer->user_size, 8);

        OUT(buffer, VIV_FE_LINK_HEADER_OP_LINK |
                    VIV_FE_LINK_HEADER_PREFETCH(prefetch));
        OUT(buffer, address);
}

static inline void CMD_STALL(struct etnaviv_cmdbuf *buffer,
        u32 from, u32 to)
{
        buffer->user_size = ALIGN(buffer->user_size, 8);

        OUT(buffer, VIV_FE_STALL_HEADER_OP_STALL);
        OUT(buffer, VIV_FE_STALL_TOKEN_FROM(from) | VIV_FE_STALL_TOKEN_TO(to));
}

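/*
 * Emit a semaphore token from one engine to another; combined with a
 * following STALL for the same pair this makes the front end wait until
 * the target engine (usually the PE) has caught up.
 */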
static inline void CMD_SEM(struct etnaviv_cmdbuf *buffer, u32 from, u32 to)
{
        CMD_LOAD_STATE(buffer, VIVS_GL_SEMAPHORE_TOKEN,
                       VIVS_GL_SEMAPHORE_TOKEN_FROM(from) |
                       VIVS_GL_SEMAPHORE_TOKEN_TO(to));
}

static void etnaviv_cmd_select_pipe(struct etnaviv_gpu *gpu,
        struct etnaviv_cmdbuf *buffer, u8 pipe)
{
        u32 flush = 0;

        lockdep_assert_held(&gpu->lock);

        /*
         * This assumes that if we're switching to 2D, we're switching
         * away from 3D, and vice versa.  Hence, if we're switching to
         * the 2D core, we need to flush the 3D depth and color caches,
         * otherwise we need to flush the 2D pixel engine cache.
         */
        if (gpu->exec_state == ETNA_PIPE_2D)
                flush = VIVS_GL_FLUSH_CACHE_PE2D;
        else if (gpu->exec_state == ETNA_PIPE_3D)
                flush = VIVS_GL_FLUSH_CACHE_DEPTH | VIVS_GL_FLUSH_CACHE_COLOR;

        CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE, flush);
        CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
        CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);

        CMD_LOAD_STATE(buffer, VIVS_GL_PIPE_SELECT,
                       VIVS_GL_PIPE_SELECT_PIPE(pipe));
}

static void etnaviv_buffer_dump(struct etnaviv_gpu *gpu,
        struct etnaviv_cmdbuf *buf, u32 off, u32 len)
{
        u32 size = buf->size;
        u32 *ptr = buf->vaddr + off;

        dev_info(gpu->dev, "virt %p phys 0x%08x free 0x%08x\n",
                        ptr, etnaviv_cmdbuf_get_va(buf) + off, size - len * 4 - off);

        print_hex_dump(KERN_INFO, "cmd ", DUMP_PREFIX_OFFSET, 16, 4,
                        ptr, len * 4, 0);
}

/*
 * Safely replace the WAIT of a waitlink with a new command and argument.
 * The GPU may be executing this WAIT while we're modifying it, so we have
 * to write it in a specific order to avoid the GPU branching to somewhere
 * else.  'wl_offset' is the offset to the first byte of the WAIT command.
 */
static void etnaviv_buffer_replace_wait(struct etnaviv_cmdbuf *buffer,
        unsigned int wl_offset, u32 cmd, u32 arg)
{
        u32 *lw = buffer->vaddr + wl_offset;

        lw[1] = arg;
        mb();
        lw[0] = cmd;
        mb();
}

/*
 * Ensure that there is space in the command buffer to contiguously write
 * 'cmd_dwords' 64-bit words into the buffer, wrapping if necessary.
 */
static u32 etnaviv_buffer_reserve(struct etnaviv_gpu *gpu,
        struct etnaviv_cmdbuf *buffer, unsigned int cmd_dwords)
{
        if (buffer->user_size + cmd_dwords * sizeof(u64) > buffer->size)
                buffer->user_size = 0;

        return etnaviv_cmdbuf_get_va(buffer) + buffer->user_size;
}

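/*
 * Write the initial WAIT/LINK loop into the ring buffer and return its
 * length as a prefetch count in 64-bit command words, ready to be handed
 * to the front end when it is started.
 */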
u16 etnaviv_buffer_init(struct etnaviv_gpu *gpu)
{
        struct etnaviv_cmdbuf *buffer = gpu->buffer;

        lockdep_assert_held(&gpu->lock);

        /* initialize buffer */
        buffer->user_size = 0;

        CMD_WAIT(buffer);
        CMD_LINK(buffer, 2, etnaviv_cmdbuf_get_va(buffer) +
                 buffer->user_size - 4);

        return buffer->user_size / 8;
}

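/*
 * Build the command stream that enables the MMUv2: select each available
 * pipe, load the master TLB address and the safe address, then stall until
 * the PE has seen the configuration.  Returns the prefetch count in 64-bit
 * command words.
 */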
u16 etnaviv_buffer_config_mmuv2(struct etnaviv_gpu *gpu, u32 mtlb_addr, u32 safe_addr)
{
        struct etnaviv_cmdbuf *buffer = gpu->buffer;

        lockdep_assert_held(&gpu->lock);

        buffer->user_size = 0;

        if (gpu->identity.features & chipFeatures_PIPE_3D) {
                CMD_LOAD_STATE(buffer, VIVS_GL_PIPE_SELECT,
                               VIVS_GL_PIPE_SELECT_PIPE(ETNA_PIPE_3D));
                CMD_LOAD_STATE(buffer, VIVS_MMUv2_CONFIGURATION,
                        mtlb_addr | VIVS_MMUv2_CONFIGURATION_MODE_MODE4_K);
                CMD_LOAD_STATE(buffer, VIVS_MMUv2_SAFE_ADDRESS, safe_addr);
                CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
        }

        if (gpu->identity.features & chipFeatures_PIPE_2D) {
                CMD_LOAD_STATE(buffer, VIVS_GL_PIPE_SELECT,
                               VIVS_GL_PIPE_SELECT_PIPE(ETNA_PIPE_2D));
                CMD_LOAD_STATE(buffer, VIVS_MMUv2_CONFIGURATION,
                        mtlb_addr | VIVS_MMUv2_CONFIGURATION_MODE_MODE4_K);
                CMD_LOAD_STATE(buffer, VIVS_MMUv2_SAFE_ADDRESS, safe_addr);
                CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
        }

        CMD_END(buffer);

        buffer->user_size = ALIGN(buffer->user_size, 8);

        return buffer->user_size / 8;
}

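/*
 * Terminate the ring buffer: flush any caches that may still be dirty for
 * the current pipe and replace the WAIT/LINK the FE is spinning in with an
 * END, either directly or via a link to the flush sequence appended here,
 * which stops the front end.
 */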
void etnaviv_buffer_end(struct etnaviv_gpu *gpu)
{
        struct etnaviv_cmdbuf *buffer = gpu->buffer;
        unsigned int waitlink_offset = buffer->user_size - 16;
        u32 link_target, flush = 0;

        lockdep_assert_held(&gpu->lock);

        if (gpu->exec_state == ETNA_PIPE_2D)
                flush = VIVS_GL_FLUSH_CACHE_PE2D;
        else if (gpu->exec_state == ETNA_PIPE_3D)
                flush = VIVS_GL_FLUSH_CACHE_DEPTH |
                        VIVS_GL_FLUSH_CACHE_COLOR |
                        VIVS_GL_FLUSH_CACHE_TEXTURE |
                        VIVS_GL_FLUSH_CACHE_TEXTUREVS |
                        VIVS_GL_FLUSH_CACHE_SHADER_L2;

        if (flush) {
                unsigned int dwords = 7;

                link_target = etnaviv_buffer_reserve(gpu, buffer, dwords);

                CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE, flush);
                if (gpu->exec_state == ETNA_PIPE_3D)
                        CMD_LOAD_STATE(buffer, VIVS_TS_FLUSH_CACHE,
                                       VIVS_TS_FLUSH_CACHE_FLUSH);
                CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
                CMD_END(buffer);

                etnaviv_buffer_replace_wait(buffer, waitlink_offset,
                                            VIV_FE_LINK_HEADER_OP_LINK |
                                            VIV_FE_LINK_HEADER_PREFETCH(dwords),
                                            link_target);
        } else {
                /* Replace the last link-wait with an "END" command */
                etnaviv_buffer_replace_wait(buffer, waitlink_offset,
                                            VIV_FE_END_HEADER_OP_END, 0);
        }
}

/* Append a 'sync point' to the ring buffer. */
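/*
 * The sync point signals 'event' from the pixel engine and then stops the
 * front end with an END.  The WAIT/LINK appended below is the point from
 * which the kernel can restart the FE once the sync point has been
 * processed.
 */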
void etnaviv_sync_point_queue(struct etnaviv_gpu *gpu, unsigned int event)
{
        struct etnaviv_cmdbuf *buffer = gpu->buffer;
        unsigned int waitlink_offset = buffer->user_size - 16;
        u32 dwords, target;

        lockdep_assert_held(&gpu->lock);

        /*
         * We need at most 4 dwords in the return target:
         * 1 event + 1 end + 1 wait + 1 link.
         */
        dwords = 4;
        target = etnaviv_buffer_reserve(gpu, buffer, dwords);

        /* Signal sync point event */
        CMD_LOAD_STATE(buffer, VIVS_GL_EVENT, VIVS_GL_EVENT_EVENT_ID(event) |
                       VIVS_GL_EVENT_FROM_PE);

        /* Stop the FE to 'pause' the GPU */
        CMD_END(buffer);

        /* Append waitlink */
        CMD_WAIT(buffer);
        CMD_LINK(buffer, 2, etnaviv_cmdbuf_get_va(buffer) +
                            buffer->user_size - 4);

        /*
         * Kick off the 'sync point' command by replacing the previous
         * WAIT with a link to the address in the ring buffer.
         */
        etnaviv_buffer_replace_wait(buffer, waitlink_offset,
                                    VIV_FE_LINK_HEADER_OP_LINK |
                                    VIV_FE_LINK_HEADER_PREFETCH(dwords),
                                    target);
}

/* Append a command buffer to the ring buffer. */
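/*
 * The generated stream consists of an optional MMU flush and/or pipe
 * switch, a LINK into the submitted command buffer, a LINK from the end of
 * that buffer back into the ring, a cache flush, the completion event and
 * a fresh WAIT/LINK loop.  Finally the previous WAIT is patched into a
 * LINK so the FE starts executing the new work.
 */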
void etnaviv_buffer_queue(struct etnaviv_gpu *gpu, u32 exec_state,
        unsigned int event, struct etnaviv_cmdbuf *cmdbuf)
{
        struct etnaviv_cmdbuf *buffer = gpu->buffer;
        unsigned int waitlink_offset = buffer->user_size - 16;
        u32 return_target, return_dwords;
        u32 link_target, link_dwords;
        bool switch_context = gpu->exec_state != exec_state;

        lockdep_assert_held(&gpu->lock);

        if (drm_debug & DRM_UT_DRIVER)
                etnaviv_buffer_dump(gpu, buffer, 0, 0x50);

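        /* Link directly to the submitted buffer unless a maintenance prologue is added below. */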
        link_target = etnaviv_cmdbuf_get_va(cmdbuf);
        link_dwords = cmdbuf->size / 8;

        /*
         * If we need maintenance prior to submitting this buffer, we will
         * need to append a mmu flush load state and/or a pipe switch,
         * followed by a new link to this buffer - the number of extra
         * dwords is worked out below.
         */
        if (gpu->mmu->need_flush || switch_context) {
                u32 target, extra_dwords;

                /* link command */
                extra_dwords = 1;

                /* flush command */
                if (gpu->mmu->need_flush) {
                        if (gpu->mmu->version == ETNAVIV_IOMMU_V1)
                                extra_dwords += 1;
                        else
                                extra_dwords += 3;
                }

                /* pipe switch commands */
                if (switch_context)
                        extra_dwords += 4;

                target = etnaviv_buffer_reserve(gpu, buffer, extra_dwords);

                if (gpu->mmu->need_flush) {
                        /* Add the MMU flush */
                        if (gpu->mmu->version == ETNAVIV_IOMMU_V1) {
                                CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_MMU,
                                               VIVS_GL_FLUSH_MMU_FLUSH_FEMMU |
                                               VIVS_GL_FLUSH_MMU_FLUSH_UNK1 |
                                               VIVS_GL_FLUSH_MMU_FLUSH_UNK2 |
                                               VIVS_GL_FLUSH_MMU_FLUSH_PEMMU |
                                               VIVS_GL_FLUSH_MMU_FLUSH_UNK4);
                        } else {
                                CMD_LOAD_STATE(buffer, VIVS_MMUv2_CONFIGURATION,
                                        VIVS_MMUv2_CONFIGURATION_MODE_MASK |
                                        VIVS_MMUv2_CONFIGURATION_ADDRESS_MASK |
                                        VIVS_MMUv2_CONFIGURATION_FLUSH_FLUSH);
                                CMD_SEM(buffer, SYNC_RECIPIENT_FE,
                                        SYNC_RECIPIENT_PE);
                                CMD_STALL(buffer, SYNC_RECIPIENT_FE,
                                        SYNC_RECIPIENT_PE);
                        }

                        gpu->mmu->need_flush = false;
                }

                if (switch_context) {
                        etnaviv_cmd_select_pipe(gpu, buffer, exec_state);
                        gpu->exec_state = exec_state;
                }

                /* And the link to the submitted buffer */
                CMD_LINK(buffer, link_dwords, link_target);

                /* Update the link target to point to above instructions */
                link_target = target;
                link_dwords = extra_dwords;
        }

        /*
         * Append a LINK to the submitted command buffer to return to
         * the ring buffer.  return_target is the ring target address.
         * We need at most 7 dwords in the return target: 2 cache flush +
         * 2 semaphore stall + 1 event + 1 wait + 1 link.
         */
        return_dwords = 7;
        return_target = etnaviv_buffer_reserve(gpu, buffer, return_dwords);
        CMD_LINK(cmdbuf, return_dwords, return_target);

        /*
         * Append a cache flush, stall, event, wait and link pointing back to
         * the wait command to the ring buffer.
         */
        if (gpu->exec_state == ETNA_PIPE_2D) {
                CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE,
                                       VIVS_GL_FLUSH_CACHE_PE2D);
        } else {
                CMD_LOAD_STATE(buffer, VIVS_GL_FLUSH_CACHE,
                                       VIVS_GL_FLUSH_CACHE_DEPTH |
                                       VIVS_GL_FLUSH_CACHE_COLOR);
                CMD_LOAD_STATE(buffer, VIVS_TS_FLUSH_CACHE,
                                       VIVS_TS_FLUSH_CACHE_FLUSH);
        }
        CMD_SEM(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
        CMD_STALL(buffer, SYNC_RECIPIENT_FE, SYNC_RECIPIENT_PE);
        CMD_LOAD_STATE(buffer, VIVS_GL_EVENT, VIVS_GL_EVENT_EVENT_ID(event) |
                       VIVS_GL_EVENT_FROM_PE);
        CMD_WAIT(buffer);
        CMD_LINK(buffer, 2, etnaviv_cmdbuf_get_va(buffer) +
                            buffer->user_size - 4);

        if (drm_debug & DRM_UT_DRIVER)
                pr_info("stream link to 0x%08x @ 0x%08x %p\n",
                        return_target, etnaviv_cmdbuf_get_va(cmdbuf),
                        cmdbuf->vaddr);

        if (drm_debug & DRM_UT_DRIVER) {
                print_hex_dump(KERN_INFO, "cmd ", DUMP_PREFIX_OFFSET, 16, 4,
                               cmdbuf->vaddr, cmdbuf->size, 0);

                pr_info("link op: %p\n", buffer->vaddr + waitlink_offset);
                pr_info("addr: 0x%08x\n", link_target);
                pr_info("back: 0x%08x\n", return_target);
                pr_info("event: %d\n", event);
        }

        /*
         * Kick off the submitted command by replacing the previous
         * WAIT with a link to the address in the ring buffer.
         */
        etnaviv_buffer_replace_wait(buffer, waitlink_offset,
                                    VIV_FE_LINK_HEADER_OP_LINK |
                                    VIV_FE_LINK_HEADER_PREFETCH(link_dwords),
                                    link_target);

        if (drm_debug & DRM_UT_DRIVER)
                etnaviv_buffer_dump(gpu, buffer, 0, 0x50);

        gpu->lastctx = cmdbuf->ctx;
}