2 * Copyright © 2010-2011 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the
6 * "Software"), to deal in the Software without restriction, including
7 * without limitation the rights to use, copy, modify, merge, publish,
8 * distribute, sub license, and/or sell copies of the Software, and to
9 * permit persons to whom the Software is furnished to do so, subject to
10 * the following conditions:
12 * The above copyright notice and this permission notice (including the
13 * next paragraph) shall be included in all copies or substantial portions
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
17 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
19 * IN NO EVENT SHALL PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR
20 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
21 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
22 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 * Zhou Chang <chang.zhou@intel.com>
35 #include "intel_batchbuffer.h"
36 #include "i965_defines.h"
37 #include "i965_structs.h"
38 #include "i965_drv_video.h"
39 #include "i965_encoder.h"
42 gen6_mfc_pipe_mode_select(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
44 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
46 BEGIN_BCS_BATCH(batch, 4);
48 OUT_BCS_BATCH(batch, MFX_PIPE_MODE_SELECT | (4 - 2));
50 (0 << 10) | /* disable Stream-Out , advanced QP/bitrate control need enable it*/
51 (1 << 9) | /* Post Deblocking Output */
52 (0 << 8) | /* Pre Deblocking Output */
53 (0 << 7) | /* disable TLB prefectch */
54 (0 << 5) | /* not in stitch mode */
55 (1 << 4) | /* encoding mode */
56 (2 << 0)); /* Standard Select: AVC */
58 (0 << 20) | /* round flag in PB slice */
59 (0 << 19) | /* round flag in Intra8x8 */
60 (0 << 7) | /* expand NOA bus flag */
61 (1 << 6) | /* must be 1 */
62 (0 << 5) | /* disable clock gating for NOA */
63 (0 << 4) | /* terminate if AVC motion and POC table error occurs */
64 (0 << 3) | /* terminate if AVC mbdata error occurs */
65 (0 << 2) | /* terminate if AVC CABAC/CAVLC decode error occurs */
66 (0 << 1) | /* AVC long field motion vector */
67 (0 << 0)); /* always calculate AVC ILDB boundary strength */
68 OUT_BCS_BATCH(batch, 0);
70 ADVANCE_BCS_BATCH(batch);
74 gen7_mfc_pipe_mode_select(VADriverContextP ctx,
76 struct gen6_encoder_context *gen6_encoder_context)
78 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
80 assert(standard_select == MFX_FORMAT_MPEG2 ||
81 standard_select == MFX_FORMAT_AVC);
83 BEGIN_BCS_BATCH(batch, 5);
84 OUT_BCS_BATCH(batch, MFX_PIPE_MODE_SELECT | (5 - 2));
86 (MFX_LONG_MODE << 17) | /* Must be long format for encoder */
87 (MFD_MODE_VLD << 15) | /* VLD mode */
88 (0 << 10) | /* disable Stream-Out */
89 (1 << 9) | /* Post Deblocking Output */
90 (0 << 8) | /* Pre Deblocking Output */
91 (0 << 5) | /* not in stitch mode */
92 (1 << 4) | /* encoding mode */
93 (standard_select << 0)); /* standard select: avc or mpeg2 */
95 (0 << 7) | /* expand NOA bus flag */
96 (0 << 6) | /* disable slice-level clock gating */
97 (0 << 5) | /* disable clock gating for NOA */
98 (0 << 4) | /* terminate if AVC motion and POC table error occurs */
99 (0 << 3) | /* terminate if AVC mbdata error occurs */
100 (0 << 2) | /* terminate if AVC CABAC/CAVLC decode error occurs */
103 OUT_BCS_BATCH(batch, 0);
104 OUT_BCS_BATCH(batch, 0);
106 ADVANCE_BCS_BATCH(batch);
110 gen6_mfc_surface_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
112 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
113 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
115 BEGIN_BCS_BATCH(batch, 6);
117 OUT_BCS_BATCH(batch, MFX_SURFACE_STATE | (6 - 2));
118 OUT_BCS_BATCH(batch, 0);
120 ((mfc_context->surface_state.height - 1) << 19) |
121 ((mfc_context->surface_state.width - 1) << 6));
123 (MFX_SURFACE_PLANAR_420_8 << 28) | /* 420 planar YUV surface */
124 (1 << 27) | /* must be 1 for interleave U/V, hardware requirement */
125 (0 << 22) | /* surface object control state, FIXME??? */
126 ((mfc_context->surface_state.w_pitch - 1) << 3) | /* pitch */
127 (0 << 2) | /* must be 0 for interleave U/V */
128 (1 << 1) | /* must be y-tiled */
129 (I965_TILEWALK_YMAJOR << 0)); /* tile walk, TILEWALK_YMAJOR */
131 (0 << 16) | /* must be 0 for interleave U/V */
132 (mfc_context->surface_state.h_pitch)); /* y offset for U(cb) */
133 OUT_BCS_BATCH(batch, 0);
134 ADVANCE_BCS_BATCH(batch);
138 gen7_mfc_surface_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
140 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
141 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
143 BEGIN_BCS_BATCH(batch, 6);
145 OUT_BCS_BATCH(batch, MFX_SURFACE_STATE | (6 - 2));
146 OUT_BCS_BATCH(batch, 0);
148 ((mfc_context->surface_state.height - 1) << 18) |
149 ((mfc_context->surface_state.width - 1) << 4));
151 (MFX_SURFACE_PLANAR_420_8 << 28) | /* 420 planar YUV surface */
152 (1 << 27) | /* must be 1 for interleave U/V, hardware requirement */
153 (0 << 22) | /* surface object control state, FIXME??? */
154 ((mfc_context->surface_state.w_pitch - 1) << 3) | /* pitch */
155 (0 << 2) | /* must be 0 for interleave U/V */
156 (1 << 1) | /* must be tiled */
157 (I965_TILEWALK_YMAJOR << 0)); /* tile walk, TILEWALK_YMAJOR */
159 (0 << 16) | /* must be 0 for interleave U/V */
160 (mfc_context->surface_state.h_pitch)); /* y offset for U(cb) */
161 OUT_BCS_BATCH(batch, 0);
162 ADVANCE_BCS_BATCH(batch);
166 gen6_mfc_pipe_buf_addr_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
168 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
169 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
172 BEGIN_BCS_BATCH(batch, 24);
174 OUT_BCS_BATCH(batch, MFX_PIPE_BUF_ADDR_STATE | (24 - 2));
176 OUT_BCS_BATCH(batch, 0); /* pre output addr */
178 OUT_BCS_RELOC(batch, mfc_context->post_deblocking_output.bo,
179 I915_GEM_DOMAIN_INSTRUCTION, I915_GEM_DOMAIN_INSTRUCTION,
180 0); /* post output addr */
182 OUT_BCS_RELOC(batch, mfc_context->uncompressed_picture_source.bo,
183 I915_GEM_DOMAIN_INSTRUCTION, I915_GEM_DOMAIN_INSTRUCTION,
184 0); /* uncompressed data */
185 OUT_BCS_RELOC(batch, mfc_context->macroblock_status_buffer.bo,
186 I915_GEM_DOMAIN_INSTRUCTION, I915_GEM_DOMAIN_INSTRUCTION,
187 0); /* StreamOut data*/
188 OUT_BCS_RELOC(batch, mfc_context->intra_row_store_scratch_buffer.bo,
189 I915_GEM_DOMAIN_INSTRUCTION, I915_GEM_DOMAIN_INSTRUCTION,
191 OUT_BCS_RELOC(batch, mfc_context->deblocking_filter_row_store_scratch_buffer.bo,
192 I915_GEM_DOMAIN_INSTRUCTION, I915_GEM_DOMAIN_INSTRUCTION,
194 /* 7..22 Reference pictures*/
195 for (i = 0; i < ARRAY_ELEMS(mfc_context->reference_surfaces); i++) {
196 if ( mfc_context->reference_surfaces[i].bo != NULL) {
197 OUT_BCS_RELOC(batch, mfc_context->reference_surfaces[i].bo,
198 I915_GEM_DOMAIN_INSTRUCTION, I915_GEM_DOMAIN_INSTRUCTION,
201 OUT_BCS_BATCH(batch, 0);
204 OUT_BCS_RELOC(batch, mfc_context->macroblock_status_buffer.bo,
205 I915_GEM_DOMAIN_INSTRUCTION, I915_GEM_DOMAIN_INSTRUCTION,
206 0); /* Macroblock status buffer*/
208 ADVANCE_BCS_BATCH(batch);
212 gen6_mfc_ind_obj_base_addr_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
214 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
215 struct gen6_vme_context *vme_context = &gen6_encoder_context->vme_context;
217 BEGIN_BCS_BATCH(batch, 11);
219 OUT_BCS_BATCH(batch, MFX_IND_OBJ_BASE_ADDR_STATE | (11 - 2));
220 OUT_BCS_BATCH(batch, 0);
221 OUT_BCS_BATCH(batch, 0);
222 /* MFX Indirect MV Object Base Address */
223 OUT_BCS_RELOC(batch, vme_context->vme_output.bo, I915_GEM_DOMAIN_INSTRUCTION, 0, 0);
224 OUT_BCS_BATCH(batch, 0);
225 OUT_BCS_BATCH(batch, 0);
226 OUT_BCS_BATCH(batch, 0);
227 OUT_BCS_BATCH(batch, 0);
228 OUT_BCS_BATCH(batch, 0);
229 /*MFC Indirect PAK-BSE Object Base Address for Encoder*/
230 OUT_BCS_BATCH(batch, 0);
231 OUT_BCS_BATCH(batch, 0);
233 ADVANCE_BCS_BATCH(batch);
237 gen7_mfc_ind_obj_base_addr_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
239 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
240 struct gen6_vme_context *vme_context = &gen6_encoder_context->vme_context;
242 BEGIN_BCS_BATCH(batch, 11);
244 OUT_BCS_BATCH(batch, MFX_IND_OBJ_BASE_ADDR_STATE | (11 - 2));
245 OUT_BCS_BATCH(batch, 0);
246 OUT_BCS_BATCH(batch, 0);
247 /* MFX Indirect MV Object Base Address */
248 OUT_BCS_RELOC(batch, vme_context->vme_output.bo, I915_GEM_DOMAIN_INSTRUCTION, 0, 0);
249 OUT_BCS_BATCH(batch, 0x80000000); /* must set, up to 2G */
250 OUT_BCS_BATCH(batch, 0);
251 OUT_BCS_BATCH(batch, 0);
252 OUT_BCS_BATCH(batch, 0);
253 OUT_BCS_BATCH(batch, 0);
254 /*MFC Indirect PAK-BSE Object Base Address for Encoder*/
255 OUT_BCS_BATCH(batch, 0);
256 OUT_BCS_BATCH(batch, 0x80000000); /* must set, up to 2G */
258 ADVANCE_BCS_BATCH(batch);
262 gen6_mfc_bsp_buf_base_addr_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
264 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
265 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
267 BEGIN_BCS_BATCH(batch, 4);
269 OUT_BCS_BATCH(batch, MFX_BSP_BUF_BASE_ADDR_STATE | (4 - 2));
270 OUT_BCS_RELOC(batch, mfc_context->bsd_mpc_row_store_scratch_buffer.bo,
271 I915_GEM_DOMAIN_INSTRUCTION, I915_GEM_DOMAIN_INSTRUCTION,
273 OUT_BCS_BATCH(batch, 0);
274 OUT_BCS_BATCH(batch, 0);
276 ADVANCE_BCS_BATCH(batch);
280 gen6_mfc_avc_img_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
282 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
283 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
285 int width_in_mbs = (mfc_context->surface_state.width + 15) / 16;
286 int height_in_mbs = (mfc_context->surface_state.height + 15) / 16;
288 BEGIN_BCS_BATCH(batch, 13);
289 OUT_BCS_BATCH(batch, MFX_AVC_IMG_STATE | (13 - 2));
291 ((width_in_mbs * height_in_mbs) & 0xFFFF));
293 (height_in_mbs << 16) |
294 (width_in_mbs << 0));
296 (0 << 24) | /*Second Chroma QP Offset*/
297 (0 << 16) | /*Chroma QP Offset*/
298 (0 << 14) | /*Max-bit conformance Intra flag*/
299 (0 << 13) | /*Max Macroblock size conformance Inter flag*/
300 (1 << 12) | /*Should always be written as "1" */
301 (0 << 10) | /*QM Preset FLag */
302 (0 << 8) | /*Image Structure*/
303 (0 << 0) ); /*Current Decoed Image Frame Store ID, reserved in Encode mode*/
305 (400 << 16) | /*Mininum Frame size*/
306 (0 << 15) | /*Disable reading of Macroblock Status Buffer*/
307 (0 << 14) | /*Load BitStream Pointer only once, 1 slic 1 frame*/
308 (0 << 13) | /*CABAC 0 word insertion test enable*/
309 (1 << 12) | /*MVUnpackedEnable,compliant to DXVA*/
310 (1 << 10) | /*Chroma Format IDC, 4:2:0*/
311 (1 << 7) | /*0:CAVLC encoding mode,1:CABAC*/
312 (0 << 6) | /*Only valid for VLD decoding mode*/
313 (0 << 5) | /*Constrained Intra Predition Flag, from PPS*/
314 (0 << 4) | /*Direct 8x8 inference flag*/
315 (0 << 3) | /*Only 8x8 IDCT Transform Mode Flag*/
316 (1 << 2) | /*Frame MB only flag*/
317 (0 << 1) | /*MBAFF mode is in active*/
318 (0 << 0) ); /*Field picture flag*/
320 (1<<16) | /*Frame Size Rate Control Flag*/
322 (1<<9) | /*MB level Rate Control Enabling Flag*/
323 (1 << 3) | /*FrameBitRateMinReportMask*/
324 (1 << 2) | /*FrameBitRateMaxReportMask*/
325 (1 << 1) | /*InterMBMaxSizeReportMask*/
326 (1 << 0) ); /*IntraMBMaxSizeReportMask*/
327 OUT_BCS_BATCH(batch, /*Inter and Intra Conformance Max size limit*/
328 (0x0600 << 16) | /*InterMbMaxSz 192 Byte*/
329 (0x0800) ); /*IntraMbMaxSz 256 Byte*/
330 OUT_BCS_BATCH(batch, 0x00000000); /*Reserved : MBZReserved*/
331 OUT_BCS_BATCH(batch, 0x01020304); /*Slice QP Delta for bitrate control*/
332 OUT_BCS_BATCH(batch, 0xFEFDFCFB);
333 OUT_BCS_BATCH(batch, 0x80601004); /*MAX = 128KB, MIN = 64KB*/
334 OUT_BCS_BATCH(batch, 0x00800001);
335 OUT_BCS_BATCH(batch, 0);
337 ADVANCE_BCS_BATCH(batch);
341 gen7_mfc_avc_img_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
343 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
344 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
346 int width_in_mbs = (mfc_context->surface_state.width + 15) / 16;
347 int height_in_mbs = (mfc_context->surface_state.height + 15) / 16;
349 BEGIN_BCS_BATCH(batch, 16);
350 OUT_BCS_BATCH(batch, MFX_AVC_IMG_STATE | (16 - 2));
352 ((width_in_mbs * height_in_mbs) & 0xFFFF));
354 ((height_in_mbs - 1) << 16) |
355 ((width_in_mbs - 1) << 0));
357 (0 << 24) | /* Second Chroma QP Offset */
358 (0 << 16) | /* Chroma QP Offset */
359 (0 << 14) | /* Max-bit conformance Intra flag */
360 (0 << 13) | /* Max Macroblock size conformance Inter flag */
361 (0 << 12) | /* FIXME: Weighted_Pred_Flag */
362 (0 << 10) | /* FIXME: Weighted_BiPred_Idc */
363 (0 << 8) | /* FIXME: Image Structure */
364 (0 << 0) ); /* Current Decoed Image Frame Store ID, reserved in Encode mode */
366 (0 << 16) | /* Mininum Frame size */
367 (0 << 15) | /* Disable reading of Macroblock Status Buffer */
368 (0 << 14) | /* Load BitStream Pointer only once, 1 slic 1 frame */
369 (0 << 13) | /* CABAC 0 word insertion test enable */
370 (1 << 12) | /* MVUnpackedEnable,compliant to DXVA */
371 (1 << 10) | /* Chroma Format IDC, 4:2:0 */
372 (0 << 9) | /* FIXME: MbMvFormatFlag */
373 (1 << 7) | /* 0:CAVLC encoding mode,1:CABAC */
374 (0 << 6) | /* Only valid for VLD decoding mode */
375 (0 << 5) | /* Constrained Intra Predition Flag, from PPS */
376 (0 << 4) | /* Direct 8x8 inference flag */
377 (0 << 3) | /* Only 8x8 IDCT Transform Mode Flag */
378 (1 << 2) | /* Frame MB only flag */
379 (0 << 1) | /* MBAFF mode is in active */
380 (0 << 0)); /* Field picture flag */
381 OUT_BCS_BATCH(batch, 0); /* Mainly about MB rate control and debug, just ignoring */
382 OUT_BCS_BATCH(batch, /* Inter and Intra Conformance Max size limit */
383 (0xBB8 << 16) | /* InterMbMaxSz */
384 (0xEE8) ); /* IntraMbMaxSz */
385 OUT_BCS_BATCH(batch, 0); /* Reserved */
386 OUT_BCS_BATCH(batch, 0); /* Slice QP Delta for bitrate control */
387 OUT_BCS_BATCH(batch, 0); /* Slice QP Delta for bitrate control */
388 OUT_BCS_BATCH(batch, 0x8C000000);
389 OUT_BCS_BATCH(batch, 0x00010000);
390 OUT_BCS_BATCH(batch, 0);
391 OUT_BCS_BATCH(batch, 0);
392 OUT_BCS_BATCH(batch, 0);
393 OUT_BCS_BATCH(batch, 0);
395 ADVANCE_BCS_BATCH(batch);
398 static void gen6_mfc_avc_directmode_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
400 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
403 BEGIN_BCS_BATCH(batch, 69);
405 OUT_BCS_BATCH(batch, MFX_AVC_DIRECTMODE_STATE | (69 - 2));
406 //TODO: reference DMV
407 for(i = 0; i < 16; i++){
408 OUT_BCS_BATCH(batch, 0);
409 OUT_BCS_BATCH(batch, 0);
412 //TODO: current DMV just for test
414 OUT_BCS_RELOC(batch, mfc_context->direct_mv_buffers[0].bo,
415 I915_GEM_DOMAIN_INSTRUCTION, I915_GEM_DOMAIN_INSTRUCTION,
418 //drm_intel_bo_pin(mfc_context->direct_mv_buffers[0].bo, 0x1000);
419 //OUT_BCS_BATCH(batch, mfc_context->direct_mv_buffers[0].bo->offset);
420 OUT_BCS_BATCH(batch, 0);
424 OUT_BCS_BATCH(batch, 0);
427 for(i = 0; i < 34; i++) {
428 OUT_BCS_BATCH(batch, 0);
431 ADVANCE_BCS_BATCH(batch);
434 static void gen6_mfc_avc_slice_state(VADriverContextP ctx,
436 struct gen6_encoder_context *gen6_encoder_context,
437 int rate_control_enable)
439 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
440 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
442 BEGIN_BCS_BATCH(batch, 11);;
444 OUT_BCS_BATCH(batch, MFX_AVC_SLICE_STATE | (11 - 2) );
446 OUT_BCS_BATCH(batch, slice_type); /*Slice Type: I:P:B Slice*/
448 if ( slice_type == SLICE_TYPE_I )
449 OUT_BCS_BATCH(batch, 0); /*no reference frames and pred_weight_table*/
451 OUT_BCS_BATCH(batch, 0x00010000); /*1 reference frame*/
453 OUT_BCS_BATCH(batch, (0<<24) | /*Enable deblocking operation*/
454 (26<<16) | /*Slice Quantization Parameter*/
456 OUT_BCS_BATCH(batch, 0); /*First MB X&Y , the postion of current slice*/
457 OUT_BCS_BATCH(batch, ( ((mfc_context->surface_state.height+15)/16) << 16) );
460 (rate_control_enable<<31) | /*in CBR mode RateControlCounterEnable = enable*/
461 (1<<30) | /*ResetRateControlCounter*/
462 (0<<28) | /*RC Triggle Mode = Always Rate Control*/
463 (8<<24) | /*RC Stable Tolerance, middle level*/
464 (rate_control_enable<<23) | /*RC Panic Enable*/
465 (0<<22) | /*QP mode, don't modfiy CBP*/
466 (1<<19) | /*IsLastSlice*/
467 (0<<18) | /*BitstreamOutputFlag Compressed BitStream Output Disable Flag 0:enable 1:disable*/
468 (0<<17) | /*HeaderPresentFlag*/
469 (1<<16) | /*SliceData PresentFlag*/
470 (0<<15) | /*TailPresentFlag*/
471 (1<<13) | /*RBSP NAL TYPE*/
472 (0<<12) ); /*CabacZeroWordInsertionEnable*/
474 OUT_BCS_RELOC(batch, mfc_context->mfc_indirect_pak_bse_object.bo,
475 I915_GEM_DOMAIN_INSTRUCTION, I915_GEM_DOMAIN_INSTRUCTION,
476 mfc_context->mfc_indirect_pak_bse_object.offset);
478 OUT_BCS_BATCH(batch, (24<<24) | /*Target QP - 24 is lowest QP*/
479 (20<<16) | /*Target QP + 20 is highest QP*/
484 OUT_BCS_BATCH(batch, 0x08888888);
485 OUT_BCS_BATCH(batch, 0);
487 ADVANCE_BCS_BATCH(batch);
489 static void gen6_mfc_avc_qm_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
491 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
494 BEGIN_BCS_BATCH(batch, 58);
496 OUT_BCS_BATCH(batch, MFX_AVC_QM_STATE | 56);
497 OUT_BCS_BATCH(batch, 0xFF ) ;
498 for( i = 0; i < 56; i++) {
499 OUT_BCS_BATCH(batch, 0x10101010);
502 ADVANCE_BCS_BATCH(batch);
505 static void gen6_mfc_avc_fqm_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
507 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
510 BEGIN_BCS_BATCH(batch, 113);
511 OUT_BCS_BATCH(batch, MFC_AVC_FQM_STATE | (113 - 2));
513 for(i = 0; i < 112;i++) {
514 OUT_BCS_BATCH(batch, 0x10001000);
517 ADVANCE_BCS_BATCH(batch);
521 gen7_mfc_qm_state(VADriverContextP ctx,
525 struct gen6_encoder_context *gen6_encoder_context)
527 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
528 unsigned int qm_buffer[16];
530 assert(qm_length <= 16);
531 assert(sizeof(*qm) == 4);
532 memcpy(qm_buffer, qm, qm_length * 4);
534 BEGIN_BCS_BATCH(batch, 18);
535 OUT_BCS_BATCH(batch, MFX_QM_STATE | (18 - 2));
536 OUT_BCS_BATCH(batch, qm_type << 0);
537 intel_batchbuffer_data(batch, qm_buffer, 16 * 4);
538 ADVANCE_BCS_BATCH(batch);
541 static void gen7_mfc_avc_qm_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
543 unsigned int qm[16] = {
544 0x10101010, 0x10101010, 0x10101010, 0x10101010,
545 0x10101010, 0x10101010, 0x10101010, 0x10101010,
546 0x10101010, 0x10101010, 0x10101010, 0x10101010,
547 0x10101010, 0x10101010, 0x10101010, 0x10101010
550 gen7_mfc_qm_state(ctx, MFX_QM_AVC_4X4_INTRA_MATRIX, qm, 12, gen6_encoder_context);
551 gen7_mfc_qm_state(ctx, MFX_QM_AVC_4X4_INTER_MATRIX, qm, 12, gen6_encoder_context);
552 gen7_mfc_qm_state(ctx, MFX_QM_AVC_8x8_INTRA_MATRIX, qm, 16, gen6_encoder_context);
553 gen7_mfc_qm_state(ctx, MFX_QM_AVC_8x8_INTER_MATRIX, qm, 16, gen6_encoder_context);
557 gen7_mfc_fqm_state(VADriverContextP ctx,
561 struct gen6_encoder_context *gen6_encoder_context)
563 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
564 unsigned int fqm_buffer[32];
566 assert(fqm_length <= 32);
567 assert(sizeof(*fqm) == 4);
568 memcpy(fqm_buffer, fqm, fqm_length * 4);
570 BEGIN_BCS_BATCH(batch, 34);
571 OUT_BCS_BATCH(batch, MFX_FQM_STATE | (34 - 2));
572 OUT_BCS_BATCH(batch, fqm_type << 0);
573 intel_batchbuffer_data(batch, fqm_buffer, 32 * 4);
574 ADVANCE_BCS_BATCH(batch);
577 static void gen7_mfc_avc_fqm_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
579 unsigned int qm[32] = {
580 0x10001000, 0x10001000, 0x10001000, 0x10001000,
581 0x10001000, 0x10001000, 0x10001000, 0x10001000,
582 0x10001000, 0x10001000, 0x10001000, 0x10001000,
583 0x10001000, 0x10001000, 0x10001000, 0x10001000,
584 0x10001000, 0x10001000, 0x10001000, 0x10001000,
585 0x10001000, 0x10001000, 0x10001000, 0x10001000,
586 0x10001000, 0x10001000, 0x10001000, 0x10001000,
587 0x10001000, 0x10001000, 0x10001000, 0x10001000
590 gen7_mfc_fqm_state(ctx, MFX_QM_AVC_4X4_INTRA_MATRIX, qm, 24, gen6_encoder_context);
591 gen7_mfc_fqm_state(ctx, MFX_QM_AVC_4X4_INTER_MATRIX, qm, 24, gen6_encoder_context);
592 gen7_mfc_fqm_state(ctx, MFX_QM_AVC_8x8_INTRA_MATRIX, qm, 32, gen6_encoder_context);
593 gen7_mfc_fqm_state(ctx, MFX_QM_AVC_8x8_INTER_MATRIX, qm, 32, gen6_encoder_context);
596 static void gen6_mfc_avc_ref_idx_state(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
598 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
601 BEGIN_BCS_BATCH(batch, 10);
602 OUT_BCS_BATCH(batch, MFX_AVC_REF_IDX_STATE | 8);
603 OUT_BCS_BATCH(batch, 0); //Select L0
604 OUT_BCS_BATCH(batch, 0x80808020); //Only 1 reference
605 for(i = 0; i < 7; i++) {
606 OUT_BCS_BATCH(batch, 0x80808080);
608 ADVANCE_BCS_BATCH(batch);
610 BEGIN_BCS_BATCH(batch, 10);
611 OUT_BCS_BATCH(batch, MFX_AVC_REF_IDX_STATE | 8);
612 OUT_BCS_BATCH(batch, 1); //Select L1
613 OUT_BCS_BATCH(batch, 0x80808022); //Only 1 reference
614 for(i = 0; i < 7; i++) {
615 OUT_BCS_BATCH(batch, 0x80808080);
617 ADVANCE_BCS_BATCH(batch);
621 gen6_mfc_avc_insert_object(VADriverContextP ctx, int flush_data, struct gen6_encoder_context *gen6_encoder_context)
623 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
625 BEGIN_BCS_BATCH(batch, 4);
627 OUT_BCS_BATCH(batch, MFC_AVC_INSERT_OBJECT | (4 -2 ) );
628 OUT_BCS_BATCH(batch, (32<<8) |
633 OUT_BCS_BATCH(batch, 0x00000003);
634 OUT_BCS_BATCH(batch, 0xABCD1234);
636 ADVANCE_BCS_BATCH(batch);
640 gen6_mfc_avc_pak_object_intra(VADriverContextP ctx, int x, int y, int end_mb, int qp,unsigned int *msg,
641 struct gen6_encoder_context *gen6_encoder_context,
642 int intra_mb_size_in_bits)
644 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
645 int len_in_dwords = 11;
646 unsigned char target_mb_size = intra_mb_size_in_bits / 16; //In Words
647 unsigned char max_mb_size = target_mb_size * 2 > 255? 255: target_mb_size * 2 ;
649 BEGIN_BCS_BATCH(batch, len_in_dwords);
651 OUT_BCS_BATCH(batch, MFC_AVC_PAK_OBJECT | (len_in_dwords - 2));
652 OUT_BCS_BATCH(batch, 0);
653 OUT_BCS_BATCH(batch, 0);
655 (0 << 24) | /* PackedMvNum, Debug*/
656 (0 << 20) | /* No motion vector */
657 (1 << 19) | /* CbpDcY */
658 (1 << 18) | /* CbpDcU */
659 (1 << 17) | /* CbpDcV */
662 OUT_BCS_BATCH(batch, (0xFFFF<<16) | (y << 8) | x); /* Code Block Pattern for Y*/
663 OUT_BCS_BATCH(batch, 0x000F000F); /* Code Block Pattern */
664 OUT_BCS_BATCH(batch, (0 << 27) | (end_mb << 26) | qp); /* Last MB */
666 /*Stuff for Intra MB*/
667 OUT_BCS_BATCH(batch, msg[1]); /* We using Intra16x16 no 4x4 predmode*/
668 OUT_BCS_BATCH(batch, msg[2]);
669 OUT_BCS_BATCH(batch, msg[3]&0xFC);
671 /*MaxSizeInWord and TargetSzieInWord*/
672 OUT_BCS_BATCH(batch, (max_mb_size << 24) |
673 (target_mb_size << 16) );
675 ADVANCE_BCS_BATCH(batch);
677 return len_in_dwords;
680 static int gen6_mfc_avc_pak_object_inter(VADriverContextP ctx, int x, int y, int end_mb, int qp, unsigned int offset,
681 struct gen6_encoder_context *gen6_encoder_context,
682 int inter_mb_size_in_bits)
684 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
685 int len_in_dwords = 11;
686 unsigned char target_mb_size = inter_mb_size_in_bits / 16; //In Words
687 unsigned char max_mb_size = target_mb_size * 16 > 255? 255: target_mb_size * 16 ;
689 BEGIN_BCS_BATCH(batch, len_in_dwords);
691 OUT_BCS_BATCH(batch, MFC_AVC_PAK_OBJECT | (len_in_dwords - 2));
693 OUT_BCS_BATCH(batch, 32); /* 32 MV*/
694 OUT_BCS_BATCH(batch, offset);
697 (1 << 24) | /* PackedMvNum, Debug*/
698 (4 << 20) | /* 8 MV, SNB don't use it*/
699 (1 << 19) | /* CbpDcY */
700 (1 << 18) | /* CbpDcU */
701 (1 << 17) | /* CbpDcV */
702 (0 << 15) | /* Transform8x8Flag = 0*/
703 (0 << 14) | /* Frame based*/
704 (0 << 13) | /* Inter MB */
705 (1 << 8) | /* MbType = P_L0_16x16 */
706 (0 << 7) | /* MBZ for frame */
708 (2 << 4) | /* MBZ for inter*/
710 (0 << 2) | /* SkipMbFlag */
711 (0 << 0)); /* InterMbMode */
713 OUT_BCS_BATCH(batch, (0xFFFF<<16) | (y << 8) | x); /* Code Block Pattern for Y*/
714 OUT_BCS_BATCH(batch, 0x000F000F); /* Code Block Pattern */
715 OUT_BCS_BATCH(batch, (0 << 27) | (end_mb << 26) | qp); /* Last MB */
717 /*Stuff for Inter MB*/
718 OUT_BCS_BATCH(batch, 0x0);
719 OUT_BCS_BATCH(batch, 0x0);
720 OUT_BCS_BATCH(batch, 0x0);
722 /*MaxSizeInWord and TargetSzieInWord*/
723 OUT_BCS_BATCH(batch, (max_mb_size << 24) |
724 (target_mb_size << 16) );
726 ADVANCE_BCS_BATCH(batch);
728 return len_in_dwords;
731 static void gen6_mfc_init(VADriverContextP ctx, struct gen6_encoder_context *gen6_encoder_context)
733 struct i965_driver_data *i965 = i965_driver_data(ctx);
734 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
738 /*Encode common setup for MFC*/
739 dri_bo_unreference(mfc_context->post_deblocking_output.bo);
740 mfc_context->post_deblocking_output.bo = NULL;
742 dri_bo_unreference(mfc_context->pre_deblocking_output.bo);
743 mfc_context->pre_deblocking_output.bo = NULL;
745 dri_bo_unreference(mfc_context->uncompressed_picture_source.bo);
746 mfc_context->uncompressed_picture_source.bo = NULL;
748 dri_bo_unreference(mfc_context->mfc_indirect_pak_bse_object.bo);
749 mfc_context->mfc_indirect_pak_bse_object.bo = NULL;
751 for (i = 0; i < NUM_MFC_DMV_BUFFERS; i++){
752 dri_bo_unreference(mfc_context->direct_mv_buffers[i].bo);
753 mfc_context->direct_mv_buffers[i].bo = NULL;
756 for (i = 0; i < MAX_MFC_REFERENCE_SURFACES; i++){
757 if (mfc_context->reference_surfaces[i].bo != NULL)
758 dri_bo_unreference(mfc_context->reference_surfaces[i].bo);
759 mfc_context->reference_surfaces[i].bo = NULL;
762 dri_bo_unreference(mfc_context->intra_row_store_scratch_buffer.bo);
763 bo = dri_bo_alloc(i965->intel.bufmgr,
768 mfc_context->intra_row_store_scratch_buffer.bo = bo;
770 dri_bo_unreference(mfc_context->macroblock_status_buffer.bo);
771 bo = dri_bo_alloc(i965->intel.bufmgr,
776 mfc_context->macroblock_status_buffer.bo = bo;
778 dri_bo_unreference(mfc_context->deblocking_filter_row_store_scratch_buffer.bo);
779 bo = dri_bo_alloc(i965->intel.bufmgr,
781 49152, /* 6 * 128 * 64 */
784 mfc_context->deblocking_filter_row_store_scratch_buffer.bo = bo;
786 dri_bo_unreference(mfc_context->bsd_mpc_row_store_scratch_buffer.bo);
787 bo = dri_bo_alloc(i965->intel.bufmgr,
789 12288, /* 1.5 * 128 * 64 */
792 mfc_context->bsd_mpc_row_store_scratch_buffer.bo = bo;
795 void gen6_mfc_avc_pipeline_programing(VADriverContextP ctx,
796 struct encode_state *encode_state,
797 struct gen6_encoder_context *gen6_encoder_context)
799 struct i965_driver_data *i965 = i965_driver_data(ctx);
800 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
801 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
802 struct gen6_vme_context *vme_context = &gen6_encoder_context->vme_context;
803 VAEncSequenceParameterBufferH264Ext *pSequenceParameter = (VAEncSequenceParameterBufferH264Ext *)encode_state->seq_param->buffer;
804 VAEncPictureParameterBufferH264Ext *pPicParameter = (VAEncPictureParameterBufferH264Ext *)encode_state->pic_param->buffer;
805 VAEncSliceParameterBufferH264Ext *pSliceParameter = (VAEncSliceParameterBufferH264Ext *)encode_state->slice_params[0]->buffer; /* FIXME: multi slices */
807 unsigned int *msg = NULL, offset = 0;
808 int emit_new_state = 1, object_len_in_bytes;
809 int is_intra = pSliceParameter->slice_type == SLICE_TYPE_I;
810 int width_in_mbs = (mfc_context->surface_state.width + 15) / 16;
811 int height_in_mbs = (mfc_context->surface_state.height + 15) / 16;
813 int rate_control_mode = pSequenceParameter->rate_control_method;
814 float fps = pSequenceParameter->time_scale * 0.5 / pSequenceParameter->num_units_in_tick ;
816 int inter_mb_size = pSequenceParameter->bits_per_second * 1.0 / fps / width_in_mbs / height_in_mbs;
817 int intra_mb_size = inter_mb_size * 5.0;
818 int qp = pPicParameter->pic_init_qp;
820 if ( rate_control_mode != 2) {
822 if ( intra_mb_size > 384*8) //ONE MB raw data is 384 bytes
823 intra_mb_size = 384*8;
824 if ( inter_mb_size > 256*8)
825 intra_mb_size = 256*8;
828 intel_batchbuffer_start_atomic_bcs(batch, 0x1000);
831 dri_bo_map(vme_context->vme_output.bo , 1);
832 msg = (unsigned int *)vme_context->vme_output.bo->virtual;
835 for (y = 0; y < height_in_mbs; y++) {
836 for (x = 0; x < width_in_mbs; x++) {
837 int last_mb = (y == (height_in_mbs-1)) && ( x == (width_in_mbs-1) );
839 if (emit_new_state) {
840 intel_batchbuffer_emit_mi_flush(batch);
842 if (IS_GEN7(i965->intel.device_id)) {
843 gen7_mfc_pipe_mode_select(ctx, MFX_FORMAT_AVC, gen6_encoder_context);
844 gen7_mfc_surface_state(ctx, gen6_encoder_context);
845 gen7_mfc_ind_obj_base_addr_state(ctx, gen6_encoder_context);
847 gen6_mfc_pipe_mode_select(ctx, gen6_encoder_context);
848 gen6_mfc_surface_state(ctx, gen6_encoder_context);
849 gen6_mfc_ind_obj_base_addr_state(ctx, gen6_encoder_context);
852 gen6_mfc_pipe_buf_addr_state(ctx, gen6_encoder_context);
853 gen6_mfc_bsp_buf_base_addr_state(ctx, gen6_encoder_context);
855 if (IS_GEN7(i965->intel.device_id)) {
856 gen7_mfc_avc_img_state(ctx, gen6_encoder_context);
857 gen7_mfc_avc_qm_state(ctx, gen6_encoder_context);
858 gen7_mfc_avc_fqm_state(ctx, gen6_encoder_context);
860 gen6_mfc_avc_img_state(ctx, gen6_encoder_context);
861 gen6_mfc_avc_qm_state(ctx, gen6_encoder_context);
862 gen6_mfc_avc_fqm_state(ctx, gen6_encoder_context);
865 gen6_mfc_avc_ref_idx_state(ctx, gen6_encoder_context);
866 gen6_mfc_avc_slice_state(ctx, pSliceParameter->slice_type, gen6_encoder_context, rate_control_mode == 0);
872 object_len_in_bytes = gen6_mfc_avc_pak_object_intra(ctx, x, y, last_mb, qp, msg, gen6_encoder_context, intra_mb_size);
875 object_len_in_bytes = gen6_mfc_avc_pak_object_inter(ctx, x, y, last_mb, qp, offset, gen6_encoder_context, inter_mb_size);
879 if (intel_batchbuffer_check_free_space(batch, object_len_in_bytes) == 0) {
880 intel_batchbuffer_end_atomic(batch);
881 intel_batchbuffer_flush(batch);
883 intel_batchbuffer_start_atomic_bcs(batch, 0x1000);
889 dri_bo_unmap(vme_context->vme_output.bo);
891 intel_batchbuffer_end_atomic(batch);
894 static VAStatus gen6_mfc_avc_prepare(VADriverContextP ctx,
895 struct encode_state *encode_state,
896 struct gen6_encoder_context *gen6_encoder_context)
898 struct i965_driver_data *i965 = i965_driver_data(ctx);
899 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
900 struct object_surface *obj_surface;
901 struct object_buffer *obj_buffer;
903 VAEncPictureParameterBufferH264Ext *pPicParameter = (VAEncPictureParameterBufferH264Ext *)encode_state->pic_param->buffer;
904 VAStatus vaStatus = VA_STATUS_SUCCESS;
907 /*Setup all the input&output object*/
908 obj_surface = SURFACE(pPicParameter->CurrPic.picture_id);
910 i965_check_alloc_surface_bo(ctx, obj_surface, 1, VA_FOURCC('N','V','1','2'));
912 mfc_context->post_deblocking_output.bo = obj_surface->bo;
913 dri_bo_reference(mfc_context->post_deblocking_output.bo);
915 mfc_context->surface_state.width = obj_surface->orig_width;
916 mfc_context->surface_state.height = obj_surface->orig_height;
917 mfc_context->surface_state.w_pitch = obj_surface->width;
918 mfc_context->surface_state.h_pitch = obj_surface->height;
920 for(i = 0; i < MAX_MFC_REFERENCE_SURFACES; i++) {
921 if ( pPicParameter->ReferenceFrames[i].picture_id != VA_INVALID_ID ) {
922 obj_surface = SURFACE(pPicParameter->ReferenceFrames[i].picture_id);
924 if (obj_surface->bo != NULL) {
925 mfc_context->reference_surfaces[i].bo = obj_surface->bo;
926 dri_bo_reference(obj_surface->bo);
933 obj_surface = SURFACE(encode_state->current_render_target);
934 assert(obj_surface && obj_surface->bo);
935 mfc_context->uncompressed_picture_source.bo = obj_surface->bo;
936 dri_bo_reference(mfc_context->uncompressed_picture_source.bo);
938 obj_buffer = BUFFER (pPicParameter->CodedBuf); /* FIXME: fix this later */
939 bo = obj_buffer->buffer_store->bo;
941 mfc_context->mfc_indirect_pak_bse_object.bo = bo;
942 mfc_context->mfc_indirect_pak_bse_object.offset = ALIGN(sizeof(VACodedBufferSegment), 64);
943 dri_bo_reference(mfc_context->mfc_indirect_pak_bse_object.bo);
945 /*Programing bcs pipeline*/
946 gen6_mfc_avc_pipeline_programing(ctx, encode_state, gen6_encoder_context); //filling the pipeline
951 static VAStatus gen6_mfc_run(VADriverContextP ctx,
952 struct encode_state *encode_state,
953 struct gen6_encoder_context *gen6_encoder_context)
955 struct intel_batchbuffer *batch = gen6_encoder_context->base.batch;
957 intel_batchbuffer_flush(batch); //run the pipeline
959 return VA_STATUS_SUCCESS;
962 static VAStatus gen6_mfc_stop(VADriverContextP ctx,
963 struct encode_state *encode_state,
964 struct gen6_encoder_context *gen6_encoder_context)
967 struct i965_driver_data *i965 = i965_driver_data(ctx);
968 struct gen6_mfc_context *mfc_context = &gen6_encoder_context->mfc_context;
970 VAEncPictureParameterBufferH264 *pPicParameter = (VAEncPictureParameterBufferH264 *)encode_state->pic_param->buffer;
972 struct object_surface *obj_surface = SURFACE(pPicParameter->reconstructed_picture);
973 //struct object_surface *obj_surface = SURFACE(pPicParameter->reference_picture[0]);
974 //struct object_surface *obj_surface = SURFACE(encode_state->current_render_target);
975 my_debug(obj_surface);
979 return VA_STATUS_SUCCESS;
983 gen6_mfc_avc_encode_picture(VADriverContextP ctx,
984 struct encode_state *encode_state,
985 struct gen6_encoder_context *gen6_encoder_context)
987 gen6_mfc_init(ctx, gen6_encoder_context);
988 gen6_mfc_avc_prepare(ctx, encode_state, gen6_encoder_context);
989 gen6_mfc_run(ctx, encode_state, gen6_encoder_context);
990 gen6_mfc_stop(ctx, encode_state, gen6_encoder_context);
992 return VA_STATUS_SUCCESS;
996 gen6_mfc_pipeline(VADriverContextP ctx,
998 struct encode_state *encode_state,
999 struct gen6_encoder_context *gen6_encoder_context)
1004 case VAProfileH264Baseline:
1005 vaStatus = gen6_mfc_avc_encode_picture(ctx, encode_state, gen6_encoder_context);
1008 /* FIXME: add for other profile */
1010 vaStatus = VA_STATUS_ERROR_UNSUPPORTED_PROFILE;
1017 Bool gen6_mfc_context_init(VADriverContextP ctx, struct gen6_mfc_context *mfc_context)
1022 Bool gen6_mfc_context_destroy(struct gen6_mfc_context *mfc_context)
1026 dri_bo_unreference(mfc_context->post_deblocking_output.bo);
1027 mfc_context->post_deblocking_output.bo = NULL;
1029 dri_bo_unreference(mfc_context->pre_deblocking_output.bo);
1030 mfc_context->pre_deblocking_output.bo = NULL;
1032 dri_bo_unreference(mfc_context->uncompressed_picture_source.bo);
1033 mfc_context->uncompressed_picture_source.bo = NULL;
1035 dri_bo_unreference(mfc_context->mfc_indirect_pak_bse_object.bo);
1036 mfc_context->mfc_indirect_pak_bse_object.bo = NULL;
1038 for (i = 0; i < NUM_MFC_DMV_BUFFERS; i++){
1039 dri_bo_unreference(mfc_context->direct_mv_buffers[i].bo);
1040 mfc_context->direct_mv_buffers[i].bo = NULL;
1043 dri_bo_unreference(mfc_context->intra_row_store_scratch_buffer.bo);
1044 mfc_context->intra_row_store_scratch_buffer.bo = NULL;
1046 dri_bo_unreference(mfc_context->macroblock_status_buffer.bo);
1047 mfc_context->macroblock_status_buffer.bo = NULL;
1049 dri_bo_unreference(mfc_context->deblocking_filter_row_store_scratch_buffer.bo);
1050 mfc_context->deblocking_filter_row_store_scratch_buffer.bo = NULL;
1052 dri_bo_unreference(mfc_context->bsd_mpc_row_store_scratch_buffer.bo);
1053 mfc_context->bsd_mpc_row_store_scratch_buffer.bo = NULL;