#include "shaders/post_processing/gen7/pa_to_pl3.g75b"
};
static const uint32_t pp_rgbx_load_save_nv12_gen8[][4] = {
-#include "shaders/post_processing/gen7/rgbx_to_nv12.g75b"
+#include "shaders/post_processing/gen8/rgbx_to_nv12.g8b"
};
static const uint32_t pp_nv12_load_save_rgbx_gen8[][4] = {
#include "shaders/post_processing/gen8/pl2_to_rgbx.g8b"
NULL,
},
- gen7_pp_rgbx_avs_initialize,
+ gen8_pp_plx_avs_initialize,
},
{
pl3_to_pl2.g8b \
pl3_to_pl3.g8b \
pl2_to_rgbx.g8b \
+ rgbx_to_nv12.g8b \
$(NULL)
INTEL_PP_G8A = \
PL3_AVS_Buf_1.g8a \
PL3_AVS_Buf_2.g8a \
PL3_AVS_Buf_3.g8a \
+ PA_AVS_Buf_0.g8a \
+ PA_AVS_Buf_1.g8a \
+ PA_AVS_Buf_2.g8a \
+ PA_AVS_Buf_3.g8a \
Save_AVS_NV12.g8a \
Save_AVS_PL3.g8a \
Save_AVS_RGBX.g8a \
Set_AVS_Buf_0123_PL2.g8a \
Set_AVS_Buf_0123_PL3.g8a \
+ Set_AVS_Buf_0123_BGRA.g8a \
YUV_to_RGB.g8a \
+ RGB_to_YUV.g8a \
Set_Layer_0.g8a \
VP_Setup.g8a \
$(NULL)
--- /dev/null
+/*
+ * Copyright 2000-2011 Intel Corporation All Rights Reserved
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+// 44 // Total instruction count
+// 1 // Total kernel count
+
+
+
+// Module name: common.inc
+//
+// Common header file for all Video-Processing kernels
+//
+
+.default_execution_size (16)
+.default_register_type :ub
+
+.reg_count_total 128
+.reg_count_payload 7
+
+//========== Common constants ==========
+
+
+//========== Macros ==========
+
+
+//Fast Jump, For more details see "Set_Layer_N.asm"
+
+
+//========== Defines ====================
+
+//========== Static Parameters (Common To All) ==========
+//r1
+
+
+//r2
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+//Color Pipe (IECP) parameters
+
+
+//ByteCopy
+
+
+//r4
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+
+//========== Inline parameters (Common To All) ===========
+
+
+//============== Binding Index Table===========
+//Common between DNDI and DNUV
+
+
+//================= Common Message Descriptor =====
+// Message descriptor for thread spawning
+// Message Descriptors
+// = 000 0001 (min message len 1 ) 0,0000 (resp len 0 -add later)
+// 0000,0000,0000
+// 0001(Spawn a root thread),0001 (Root thread spawn thread)
+// = 0x02000011
+// Thread Spawner Message Descriptor
+
+
+// Message descriptor for atomic operation add
+// Message Descriptors
+// = 000 0110 (min message len 6 ) 0,0000 (resp len 0 -add later)
+// 1(header present)001,10(typed atomic operation)0(return enabled)0(slot group, low 8 bits),0111 (AOP_Add)
+// 0000,0000 (Binding table index, added later)
+// = 0x0C098700
+
+// Atomic Operation Add Message Descriptor
+
+
+// Message descriptor for dataport media write
+ // Message Descriptors
+ // = 000 0001 (min message len 1 - add later) 00000 (resp len 0)
+ // 1 (header present 1) 0 1010 (media block write) 000000
+ // 00000000 (binding table index - set later)
+ // = 0x020A8000
+
+
+// Message Length defines
+
+
+// Response Length defines
+
+
+// Block Width and Height Size defines
+
+
+// Extended Message Descriptors
+
+
+// Common message descriptors:
+
+
+//===================== Math Function Control ===================================
+
+
+//============ Message Registers ===============
+ // buf4 starts from r28
+
+
+//#define mMSGHDR_EOT r43 // Dummy Message Register for EOT
+
+
+.declare mubMSGPAYLOAD Base=r30 ElementSize=1 SrcRegion=<16;16,1> Type=ub
+.declare muwMSGPAYLOAD Base=r30 ElementSize=2 SrcRegion=<16;16,1> Type=uw
+.declare mudMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=ud
+.declare mfMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=f
+
+//=================== End of thread instruction ===========================
+
+
+//=====================Pointers Used=====================================
+
+
+//=======================================================================
+
+
+//r9-r17
+// Define temp space for any usages
+
+
+// Common Buffers
+
+
+// temp space for rotation
+
+.declare fROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare udROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+.declare uwROBUF Base=r9.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+.declare ubROBUF Base=r9.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+.declare ub4ROBUF Base=r9.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+
+// End of common.inc
+
+
+// FileName: PL2_AVS_Buf_0.asm
+// Author: Tatiya, Rupesh
+// Description: Loads 8x8 AVS/IEF PL2 data into Buffer 0
+
+
+
+// FileName : PL2_AVS_Buf.asm
+// Author : Tatiya, Rupesh
+// Description : Loads 8x8 AVS/IEF PL2 data into Buffer N
+
+
+
+// Module name: Scaling.inc
+
+
+
+
+// Description: Includes all definitions explicit to Fast Composite.
+
+
+
+
+// End of common.inc
+
+
+//========== GRF partition ==========
+ // r0 header : r0 (1 GRF)
+ // Static parameters : r1 - r6 (6 GRFS)
+ // Inline parameters : r7 - r8 (2 GRFs)
+ // MSGSRC : r27 (1 GRF)
+//===================================
+
+//Interface:
+//========== Static Parameters (Explicit To Fast Composite) ==========
+//r1
+//CSC Set 0
+
+
+.declare udCSC_CURBE Base=r1.0 ElementSize=4 Type=ud
+
+//Constant alpha
+
+
+//r2
+
+
+// Gen7 AVS WA
+
+
+// WiDi Definitions
+
+
+//Colorfill
+
+
+ // 0: 0-degree, 1: 90, 2: 180, 3: 270-degree, clockwise.
+
+.declare ubCOLOR_PIXEL_VAL Base=r2.20 ElementSize=1 SrcRegion=<0;1,0> DstRegion=<1> Type=ub
+
+//r3
+//Normalised Ratio of Horizontal step size with main video for all layers
+
+
+ //Normalised Ratio of Horizontal step size with main video for all layers becomes
+ //Normalised Horizontal step size for all layers in VP_Setup.asm
+
+
+//r4
+//Normalised Vertical step size for all layers
+
+
+//r5
+//Normalised Vertical Frame Origin for all layers
+
+
+//r6
+//Normalised Horizontal Frame Origin for all layers
+
+
+//========== Inline Parameters (Explicit To Fast Composite) ==========
+
+
+//Main video Step X
+
+
+//====================== Binding table (Explicit To Fast Composite)=========================================
+
+
+//Used by Interlaced Scaling Kernels
+
+
+//========== Sampler State Table Index (Explicit To Fast Composite)==========
+//Sampler Index for AVS/IEF messages
+
+
+//Sampler Index for SIMD16 sampler messages
+
+
+//=============================================================================
+
+.declare fBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_4 Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_5 Base=r46.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare udBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_4 Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_5 Base=r46.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+.declare uwBUFFER_0 Base=r64.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_1 Base=r80.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_2 Base=r96.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_3 Base=r112.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_4 Base=r28.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_5 Base=r46.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+.declare ubBUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_4 Base=r28.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_5 Base=r46.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+.declare ub4BUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_4 Base=r28.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_5 Base=r46.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+//Pointer to mask reg
+
+
+//r18
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+.declare udCSC_COEFF_0 Base=r18.0 ElementSize=4 Type=ud // 1 GRF
+
+//r19
+
+
+.declare udCSC_COEFF_1 Base=r19.0 ElementSize=4 Type=ud // 1 GRF
+
+
+//r20
+
+.declare uwALPHA_MASK_REG_TEMP Base=r20.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r21
+
+.declare uwALPHA_MASK_REG Base=r21.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r22
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+//Keep fORIGIN_X_NLAS, fY_OFFSET_2ND_BLOCK, fSTEP_X_NLAS, pMSGDSC_COPY, ubCONST_ALPHA_COPY as
+//sub registers of same GRF to enable using NODDCLR NODDCHK. -rT
+
+//r23
+
+
+//Lumakey
+
+
+//r24
+
+
+//r25
+
+
+//r26
+
+
+//defines to generate LABELS during compile time.
+
+
+ // Message Header
+ // m0.7 31:0 Debug
+ // m0.6 31:0 Debug
+ // m0.5 31:0 Ignored
+ // m0.4 31:0 Ignored
+ // m0.3 31:0 Ignored
+ // m0.2 31:16 Ignored
+ // 15 Alpha Write Channel Mask enable=0, disable=1
+ // 14 Blue Write Channel Mask (U)
+ // 13 Green Write Channel Mask (Y)
+ // 12 Red Write Channel Mask (V)
+ // 11:0 Ignored
+ // m0.1 Ignored
+ // m0.0 Ignored
+
+
+ // AVS payload
+ // m1.7 Group ID Number
+ // m1.6 U 2nd Derivative ---> NLAS dx
+ // m1.5 Delta V ---> Step Y
+ // m1.4 Delta U ---> Step X
+ // m1.3 Pixel 0 V Address ---> ORIY (Y0)
+ // m1.2 Pixel 0 U Address ---> ORIX (X0)
+ // m1.1 Vertical Block Number
+ // m1.0 Reserved
+
+ // Sampler Message Descriptor
+ // 31:29 Reserved 000
+ // 28:25 Message length 0010
+ // 24:20 Response length xxxxx ---> 4GRFs for each enabled channel (AVS), 2GRFs for each enabled channel (sample unorm)
+ // 19 Header Present 1
+ // 18:17 SIMD Mode 11 ---> SIMD32/64
+ // 16:12 Message Type xxxxx ---> 01011 sample_8x8, 01100 (sample_unorm), 01010 (sample_unorm+killpix)
+ // 11:8 Sampler Index xxxx
+ // 7:0 Binding Table Index xxxxxxxx
+
+
+ // Msg Header M0.2
+ // 15:15 Alpha Write Channel Mask, 0: written back, 1: not written back
+ // 14:14 Blue Write Channel Mask
+ // 13:13 Green Write Channel Mask
+ // 12:12 Red Write Channel Mask
+
+
+//By design, Buffer 0,1,2,3 always have Layer 0 and Buffer 4,5 always have L1-L7
+
+
+//used to generate LABELS at compile time.
+
+
+ // 18:17 SIMD Mode 10 ---> SIMD16
+ // 16:12 Message Type xxxxx ---> 00000 (SIMD16)
+
+
+//r10-17 - 8 GRFs to load SIMD16 data (up to 4 channels)
+//r18-19 - 2 GRFs to store sampler ramp.
+
+ .declare mfSCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+ .declare muwSCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+ .declare mudCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+ .declare mubCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=1 SrcRegion=<32;32,1> DstRegion=<1> Type=ub
+
+
+ .declare fSCALING_0X_34X_TEMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+ .declare udSCALING_0X_34X_TEMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+ .declare ub4SCALING_0X_34X_TEMP Base=r9.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<1> Type=ub
+ .declare uwSCALING_0X_34X_TEMP Base=r9.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+ // Sampler ramp is used for Scaling 0X_0.34X
+ .declare fSAMPLER_RAMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> Type=f // 1 GRFs, 8 elements
+
+
+ //#define rMSGDSC_UV r23.0
+
+
+//End of _SCALING_
+
+
+ //NOTE: We need offsets for second half of LAYER 0 - even if we do not load it.
+ //Update the channel offset in the buffers for the lower 8x4 data for BUFFER_0.
+ mov (1) r22.4<1>:ud 0x400040:ud // one dword write: both 16-bit halves of r22.4 become 0x0040
+
+
+ mov (1) r16.3<1>:ud r0.3<0;1,0>:ud // r16 is the first register of the send payload below (header M0); dword 3 is taken from r0
+
+
+ //AVS_PAYLOAD already has all the data loaded at this point
+ add (1) a0.0<1>:ud r23.5<0;1,0>:ud 0x50EB000:ud //msg desc = r23.5 + 0x050EB000; per the descriptor layout above the immediate is: message length 2, response length 16 GRFs, header present, SIMD mode 11, message type 01011 (sample_8x8). r23.5 presumably carries the sampler / binding table index bits - TODO confirm
+
+ mov (1) r16.2<1>:ud 0x00000000:ud // Enable ARGB channels: M0.2 bits 15:12 are the write channel masks and 0 means "written back"
+
+
+
+ // set the vertical block number (payload dword m1.1) to 0 in the r25 copy of the payload
+
+ mov (1) r25.1<1>:ud 0:ud
+
+ mov (8) r17.0<1>:ud r25.0<8;8,1>:ud // Copy msg payload mirrors to MRFs: all 8 dwords of r25 go to r17, the second payload register (M1)
+
+ send (1) uwBUFFER_0(0)<1> r16 0x2 a0.0:ud // payload starts at r16, descriptor comes from a0.0, response lands at uwBUFFER_0 (declared at r64.0); 0x2 is presumably the sampler function id - TODO confirm
+ // Returns RGBA data in 16 GRFs in scrambled order (16 matches the response length encoded in the descriptor above)
+
+SKIP_AVS_LOAD_L0_0_: // nothing in this file branches to this label
+ nop
+
+
--- /dev/null
+/*
+ * Copyright 2000-2011 Intel Corporation All Rights Reserved
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+// 44 // Total instruction count
+// 1 // Total kernel count
+
+
+
+// Module name: common.inc
+//
+// Common header file for all Video-Processing kernels
+//
+
+.default_execution_size (16)
+.default_register_type :ub
+
+.reg_count_total 128
+.reg_count_payload 7
+
+//========== Common constants ==========
+
+
+//========== Macros ==========
+
+
+//Fast Jump, For more details see "Set_Layer_N.asm"
+
+
+//========== Defines ====================
+
+//========== Static Parameters (Common To All) ==========
+//r1
+
+
+//r2
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+//Color Pipe (IECP) parameters
+
+
+//ByteCopy
+
+
+//r4
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+
+//========== Inline parameters (Common To All) ===========
+
+
+//============== Binding Index Table===========
+//Common between DNDI and DNUV
+
+
+//================= Common Message Descriptor =====
+// Message descriptor for thread spawning
+// Message Descriptors
+// = 000 0001 (min message len 1 ) 0,0000 (resp len 0 -add later)
+// 0000,0000,0000
+// 0001(Spawn a root thread),0001 (Root thread spawn thread)
+// = 0x02000011
+// Thread Spawner Message Descriptor
+
+
+// Message descriptor for atomic operation add
+// Message Descriptors
+// = 000 0110 (min message len 6 ) 0,0000 (resp len 0 -add later)
+// 1(header present)001,10(typed atomic operation)0(return enabled)0(slot group, low 8 bits),0111 (AOP_Add)
+// 0000,0000 (Binding table index, added later)
+// = 0x0C098700
+
+// Atomic Operation Add Message Descriptor
+
+
+// Message descriptor for dataport media write
+ // Message Descriptors
+ // = 000 0001 (min message len 1 - add later) 00000 (resp len 0)
+ // 1 (header present 1) 0 1010 (media block write) 000000
+ // 00000000 (binding table index - set later)
+ // = 0x020A8000
+
+
+// Message Length defines
+
+
+// Response Length defines
+
+
+// Block Width and Height Size defines
+
+
+// Extended Message Descriptors
+
+
+// Common message descriptors:
+
+
+//===================== Math Function Control ===================================
+
+
+//============ Message Registers ===============
+ // buf4 starts from r28
+
+
+//#define mMSGHDR_EOT r43 // Dummy Message Register for EOT
+
+
+.declare mubMSGPAYLOAD Base=r30 ElementSize=1 SrcRegion=<16;16,1> Type=ub
+.declare muwMSGPAYLOAD Base=r30 ElementSize=2 SrcRegion=<16;16,1> Type=uw
+.declare mudMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=ud
+.declare mfMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=f
+
+//=================== End of thread instruction ===========================
+
+
+//=====================Pointers Used=====================================
+
+
+//=======================================================================
+
+
+//r9-r17
+// Define temp space for any usages
+
+
+// Common Buffers
+
+
+// temp space for rotation
+
+.declare fROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare udROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+.declare uwROBUF Base=r9.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+.declare ubROBUF Base=r9.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+.declare ub4ROBUF Base=r9.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+
+// End of common.inc
+
+
+// FileName: PL2_AVS_Buf_0.asm
+// Author: Tatiya, Rupesh
+// Description: Loads 8x8 AVS/IEF PL2 data into Buffer 1 (the send in this file targets uwBUFFER_1; header text was inherited from the Buffer 0 variant)
+
+
+
+// FileName : PL2_AVS_Buf.asm
+// Author : Tatiya, Rupesh
+// Description : Loads 8x8 AVS/IEF PL2 data into Buffer N
+
+
+
+// Module name: Scaling.inc
+
+
+
+
+// Description: Includes all definitions explicit to Fast Composite.
+
+
+
+
+// End of common.inc
+
+
+//========== GRF partition ==========
+ // r0 header : r0 (1 GRF)
+ // Static parameters : r1 - r6 (6 GRFS)
+ // Inline parameters : r7 - r8 (2 GRFs)
+ // MSGSRC : r27 (1 GRF)
+//===================================
+
+//Interface:
+//========== Static Parameters (Explicit To Fast Composite) ==========
+//r1
+//CSC Set 0
+
+
+.declare udCSC_CURBE Base=r1.0 ElementSize=4 Type=ud
+
+//Constant alpha
+
+
+//r2
+
+
+// Gen7 AVS WA
+
+
+// WiDi Definitions
+
+
+//Colorfill
+
+
+ // 0: 0-degree, 1: 90, 2: 180, 3: 270-degree, clockwise.
+
+.declare ubCOLOR_PIXEL_VAL Base=r2.20 ElementSize=1 SrcRegion=<0;1,0> DstRegion=<1> Type=ub
+
+//r3
+//Normalised Ratio of Horizontal step size with main video for all layers
+
+
+ //Normalised Ratio of Horizontal step size with main video for all layers becomes
+ //Normalised Horizontal step size for all layers in VP_Setup.asm
+
+
+//r4
+//Normalised Vertical step size for all layers
+
+
+//r5
+//Normalised Vertical Frame Origin for all layers
+
+
+//r6
+//Normalised Horizontal Frame Origin for all layers
+
+
+//========== Inline Parameters (Explicit To Fast Composite) ==========
+
+
+//Main video Step X
+
+
+//====================== Binding table (Explicit To Fast Composite)=========================================
+
+
+//Used by Interlaced Scaling Kernels
+
+
+//========== Sampler State Table Index (Explicit To Fast Composite)==========
+//Sampler Index for AVS/IEF messages
+
+
+//Sampler Index for SIMD16 sampler messages
+
+
+//=============================================================================
+
+.declare fBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_4 Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_5 Base=r46.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare udBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_4 Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_5 Base=r46.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+.declare uwBUFFER_0 Base=r64.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_1 Base=r80.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_2 Base=r96.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_3 Base=r112.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_4 Base=r28.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_5 Base=r46.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+.declare ubBUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_4 Base=r28.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_5 Base=r46.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+.declare ub4BUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_4 Base=r28.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_5 Base=r46.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+//Pointer to mask reg
+
+
+//r18
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+.declare udCSC_COEFF_0 Base=r18.0 ElementSize=4 Type=ud // 1 GRF
+
+//r19
+
+
+.declare udCSC_COEFF_1 Base=r19.0 ElementSize=4 Type=ud // 1 GRF
+
+
+//r20
+
+.declare uwALPHA_MASK_REG_TEMP Base=r20.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r21
+
+.declare uwALPHA_MASK_REG Base=r21.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r22
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+//Keep fORIGIN_X_NLAS, fY_OFFSET_2ND_BLOCK, fSTEP_X_NLAS, pMSGDSC_COPY, ubCONST_ALPHA_COPY as
+//sub registers of same GRF to enable using NODDCLR NODDCHK. -rT
+
+//r23
+
+
+//Lumakey
+
+
+//r24
+
+
+//r25
+
+
+//r26
+
+
+//defines to generate LABELS during compile time.
+
+
+ // Message Header
+ // m0.7 31:0 Debug
+ // m0.6 31:0 Debug
+ // m0.5 31:0 Ignored
+ // m0.4 31:0 Ignored
+ // m0.3 31:0 Ignored
+ // m0.2 31:16 Ignored
+ // 15 Alpha Write Channel Mask enable=0, disable=1
+ // 14 Blue Write Channel Mask (U)
+ // 13 Green Write Channel Mask (Y)
+ // 12 Red Write Channel Mask (V)
+ // 11:0 Ignored
+ // m0.1 Ignored
+ // m0.0 Ignored
+
+
+ // AVS payload
+ // m1.7 Group ID Number
+ // m1.6 U 2nd Derivative ---> NLAS dx
+ // m1.5 Delta V ---> Step Y
+ // m1.4 Delta U ---> Step X
+ // m1.3 Pixel 0 V Address ---> ORIY (Y0)
+ // m1.2 Pixel 0 U Address ---> ORIX (X0)
+ // m1.1 Vertical Block Number
+ // m1.0 Reserved
+
+ // Sampler Message Descriptor
+ // 31:29 Reserved 000
+ // 28:25 Message length 0010
+ // 24:20 Response length xxxxx ---> 4GRFs for each enabled channel (AVS), 2GRFs for each enabled channel (sample unorm)
+ // 19 Header Present 1
+ // 18:17 SIMD Mode 11 ---> SIMD32/64
+ // 16:12 Message Type xxxxx ---> 01011 sample_8x8, 01100 (sample_unorm), 01010 (sample_unorm+killpix)
+ // 11:8 Sampler Index xxxx
+ // 7:0 Binding Table Index xxxxxxxx
+
+
+ // Msg Header M0.2
+ // 15:15 Alpha Write Channel Mask, 0: written back, 1: not written back
+ // 14:14 Blue Write Channel Mask
+ // 13:13 Green Write Channel Mask
+ // 12:12 Red Write Channel Mask
+
+
+//By design, Buffer 0,1,2,3 always have Layer 0 and Buffer 4,5 always have L1-L7
+
+
+//used to generate LABELS at compile time.
+
+
+ // 18:17 SIMD Mode 10 ---> SIMD16
+ // 16:12 Message Type xxxxx ---> 00000 (SIMD16)
+
+
+//r10-17 - 8 GRFs to load SIMD16 data (up to 4 channels)
+//r18-19 - 2 GRFs to store sampler ramp.
+
+ .declare mfSCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+ .declare muwSCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+ .declare mudCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+ .declare mubCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=1 SrcRegion=<32;32,1> DstRegion=<1> Type=ub
+
+
+ .declare fSCALING_0X_34X_TEMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+ .declare udSCALING_0X_34X_TEMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+ .declare ub4SCALING_0X_34X_TEMP Base=r9.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<1> Type=ub
+ .declare uwSCALING_0X_34X_TEMP Base=r9.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+ // Sampler ramp is used for Scaling 0X_0.34X
+ .declare fSAMPLER_RAMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> Type=f // 1 GRFs, 8 elements
+
+
+ //#define rMSGDSC_UV r23.0
+
+
+//End of _SCALING_
+
+
+ //NOTE: We need offsets for second half of LAYER 0 - even if we do not load it.
+ //Update the channel offset in the buffers for the lower 8x4 data for BUFFER_0.
+ mov (1) r22.4<1>:ud 0x400040:ud // one dword write: both 16-bit halves of r22.4 become 0x0040
+
+
+ mov (1) r16.3<1>:ud r0.3<0;1,0>:ud // r16 is the first register of the send payload below (header M0); dword 3 is taken from r0
+
+
+ //AVS_PAYLOAD already has all the data loaded at this point
+ add (1) a0.0<1>:ud r23.5<0;1,0>:ud 0x50EB000:ud //msg desc = r23.5 + 0x050EB000; per the descriptor layout above the immediate is: message length 2, response length 16 GRFs, header present, SIMD mode 11, message type 01011 (sample_8x8). r23.5 presumably carries the sampler / binding table index bits - TODO confirm
+
+ mov (1) r16.2<1>:ud 0x00000000:ud // Enable ARGB channels: M0.2 bits 15:12 are the write channel masks and 0 means "written back"
+
+
+
+ // set the vertical block number (payload dword m1.1) to 1 in the r25 copy of the payload
+
+ mov (1) r25.1<1>:ud 1:ud
+
+ mov (8) r17.0<1>:ud r25.0<8;8,1>:ud // Copy msg payload mirrors to MRFs: all 8 dwords of r25 go to r17, the second payload register (M1)
+
+ send (1) uwBUFFER_1(0)<1> r16 0x2 a0.0:ud // payload starts at r16, descriptor comes from a0.0, response lands at uwBUFFER_1 (declared at r80.0); 0x2 is presumably the sampler function id - TODO confirm
+ // Returns RGBA data in 16 GRFs in scrambled order (16 matches the response length encoded in the descriptor above)
+
+SKIP_AVS_LOAD_L0_0_: // NOTE(review): same label text as the block-0 file although this file loads block 1 into uwBUFFER_1 - confirm the label cannot collide if the .g8a pieces are assembled together
+ nop
+
+
--- /dev/null
+/*
+ * Copyright 2000-2011 Intel Corporation All Rights Reserved
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+// 44 // Total instruction count
+// 1 // Total kernel count
+
+
+
+// Module name: common.inc
+//
+// Common header file for all Video-Processing kernels
+//
+
+.default_execution_size (16)
+.default_register_type :ub
+
+.reg_count_total 128
+.reg_count_payload 7
+
+//========== Common constants ==========
+
+
+//========== Macros ==========
+
+
+//Fast Jump, For more details see "Set_Layer_N.asm"
+
+
+//========== Defines ====================
+
+//========== Static Parameters (Common To All) ==========
+//r1
+
+
+//r2
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+//Color Pipe (IECP) parameters
+
+
+//ByteCopy
+
+
+//r4
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+
+//========== Inline parameters (Common To All) ===========
+
+
+//============== Binding Index Table===========
+//Common between DNDI and DNUV
+
+
+//================= Common Message Descriptor =====
+// Message descriptor for thread spawning
+// Message Descriptors
+// = 000 0001 (min message len 1 ) 0,0000 (resp len 0 -add later)
+// 0000,0000,0000
+// 0001(Spawn a root thread),0001 (Root thread spawn thread)
+// = 0x02000011
+// Thread Spawner Message Descriptor
+
+
+// Message descriptor for atomic operation add
+// Message Descriptors
+// = 000 0110 (min message len 6 ) 0,0000 (resp len 0 -add later)
+// 1(header present)001,10(typed atomic operation)0(return enabled)0(slot group, low 8 bits),0111 (AOP_Add)
+// 0000,0000 (Binding table index, added later)
+// = 0x0C098700
+
+// Atomic Operation Add Message Descriptor
+
+
+// Message descriptor for dataport media write
+ // Message Descriptors
+ // = 000 0001 (min message len 1 - add later) 00000 (resp len 0)
+ // 1 (header present 1) 0 1010 (media block write) 000000
+ // 00000000 (binding table index - set later)
+ // = 0x020A8000
+
+
+// Message Length defines
+
+
+// Response Length defines
+
+
+// Block Width and Height Size defines
+
+
+// Extended Message Descriptors
+
+
+// Common message descriptors:
+
+
+//===================== Math Function Control ===================================
+
+
+//============ Message Registers ===============
+ // buf4 starts from r28
+
+
+//#define mMSGHDR_EOT r43 // Dummy Message Register for EOT
+
+
+.declare mubMSGPAYLOAD Base=r30 ElementSize=1 SrcRegion=<16;16,1> Type=ub
+.declare muwMSGPAYLOAD Base=r30 ElementSize=2 SrcRegion=<16;16,1> Type=uw
+.declare mudMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=ud
+.declare mfMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=f
+
+//=================== End of thread instruction ===========================
+
+
+//=====================Pointers Used=====================================
+
+
+//=======================================================================
+
+
+//r9-r17
+// Define temp space for any usages
+
+
+// Common Buffers
+
+
+// temp space for rotation
+
+.declare fROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare udROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+.declare uwROBUF Base=r9.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+.declare ubROBUF Base=r9.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+.declare ub4ROBUF Base=r9.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+
+// End of common.inc
+
+
+// FileName: PL2_AVS_Buf_0.asm
+// Author: Tatiya, Rupesh
+// Description: Loads 8x8 AVS/IEF PL2 data into Buffer 0
+
+
+
+// FileName : PL2_AVS_Buf.asm
+// Author : Tatiya, Rupesh
+// Description : Loads 8x8 AVS/IEF PL2 data into Buffer N
+
+
+
+// Module name: Scaling.inc
+
+
+
+
+// Description: Includes all definitions explicit to Fast Composite.
+
+
+
+
+// End of common.inc
+
+
+//========== GRF partition ==========
+ // r0 header : r0 (1 GRF)
+ // Static parameters : r1 - r6 (6 GRFS)
+ // Inline parameters : r7 - r8 (2 GRFs)
+ // MSGSRC : r27 (1 GRF)
+//===================================
+
+//Interface:
+//========== Static Parameters (Explicit To Fast Composite) ==========
+//r1
+//CSC Set 0
+
+
+.declare udCSC_CURBE Base=r1.0 ElementSize=4 Type=ud
+
+//Constant alpha
+
+
+//r2
+
+
+// Gen7 AVS WA
+
+
+// WiDi Definitions
+
+
+//Colorfill
+
+
+ // 0: 0-degree, 1: 90, 2: 180, 3: 270-degree, clockwise.
+
+.declare ubCOLOR_PIXEL_VAL Base=r2.20 ElementSize=1 SrcRegion=<0;1,0> DstRegion=<1> Type=ub
+
+//r3
+//Normalised Ratio of Horizontal step size with main video for all layers
+
+
+ //Normalised Ratio of Horizontal step size with main video for all layers becomes
+ //Normalised Horizontal step size for all layers in VP_Setup.asm
+
+
+//r4
+//Normalised Vertical step size for all layers
+
+
+//r5
+//Normalised Vertical Frame Origin for all layers
+
+
+//r6
+//Normalised Horizontal Frame Origin for all layers
+
+
+//========== Inline Parameters (Explicit To Fast Composite) ==========
+
+
+//Main video Step X
+
+
+//====================== Binding table (Explicit To Fast Composite)=========================================
+
+
+//Used by Interlaced Scaling Kernels
+
+
+//========== Sampler State Table Index (Explicit To Fast Composite)==========
+//Sampler Index for AVS/IEF messages
+
+
+//Sampler Index for SIMD16 sampler messages
+
+
+//=============================================================================
+
+.declare fBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_4 Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_5 Base=r46.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare udBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_4 Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_5 Base=r46.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+.declare uwBUFFER_0 Base=r64.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_1 Base=r80.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_2 Base=r96.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_3 Base=r112.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_4 Base=r28.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_5 Base=r46.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+.declare ubBUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_4 Base=r28.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_5 Base=r46.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+.declare ub4BUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_4 Base=r28.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_5 Base=r46.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+//Pointer to mask reg
+
+
+//r18
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+.declare udCSC_COEFF_0 Base=r18.0 ElementSize=4 Type=ud // 1 GRF
+
+//r19
+
+
+.declare udCSC_COEFF_1 Base=r19.0 ElementSize=4 Type=ud // 1 GRF
+
+
+//r20
+
+.declare uwALPHA_MASK_REG_TEMP Base=r20.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r21
+
+.declare uwALPHA_MASK_REG Base=r21.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r22
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+//Keep fORIGIN_X_NLAS, fY_OFFSET_2ND_BLOCK, fSTEP_X_NLAS, pMSGDSC_COPY, ubCONST_ALPHA_COPY as
+//sub registers of same GRF to enable using NODDCLR NODDCHK. -rT
+
+//r23
+
+
+//Lumakey
+
+
+//r24
+
+
+//r25
+
+
+//r26
+
+
+//defines to generate LABELS during compile time.
+
+
+ // Message Header
+ // m0.7 31:0 Debug
+ // m0.6 31:0 Debug
+ // m0.5 31:0 Ignored
+ // m0.4 31:0 Ignored
+ // m0.3 31:0 Ignored
+ // m0.2 31:16 Ignored
+ // 15 Alpha Write Channel Mask enable=0, disable=1
+ // 14 Blue Write Channel Mask (U)
+ // 13 Green Write Channel Mask (Y)
+ // 12 Red Write Channel Mask (V)
+ // 11:0 Ignored
+ // m0.1 Ignored
+ // m0.0 Ignored
+
+
+ // AVS payload
+ // m1.7 Group ID Number
+ // m1.6 U 2nd Derivative ---> NLAS dx
+ // m1.5 Delta V ---> Step Y
+ // m1.4 Delta U ---> Step X
+ // m1.3 Pixel 0 V Address ---> ORIY (Y0)
+ // m1.2 Pixel 0 U Address ---> ORIX (X0)
+ // m1.1 Vertical Block Number
+ // m1.0 Reserved
+
+ // Sampler Message Descriptor
+ // 31:29 Reserved 000
+ // 28:25 Message length 0010
+ // 24:20 Response length xxxxx ---> 4GRFs for each enabled channel (AVS), 2GRFs for each enabled channel (sample unorm)
+ // 19 Header Present 1
+ // 18:17 SIMD Mode 11 ---> SIMD32/64
+ // 16:12 Message Type xxxxx ---> 01011 sample_8x8, 01100 (sample_unorm), 01010 (sample_unorm+killpix)
+ // 11:8 Sampler Index xxxx
+ // 7:0 Binding Table Index xxxxxxxx
+
+
+ // Msg Header M0.2
+ // 15:15 Alpha Write Channel Mask, 0: written back, 1: not written back
+ // 14:14 Blue Write Channel Mask
+ // 13:13 Green Write Channel Mask
+ // 12:12 Red Write Channel Mask
+
+
+//By design, Buffer 0,1,2,3 always have Layer 0 and Buffer 4,5 always have L1-L7
+
+
+//used to generate LABELS at compile time.
+
+
+ // 18:17 SIMD Mode 10 ---> SIMD16
+ // 16:12 Message Type xxxxx ---> 00000 (SIMD16)
+
+
+//r10-17 - 8 GRFs to load SIMD16 data (upto 4 channels)
+//r18-19 - 2 GRFs to store sampler ramp.
+
+ .declare mfSCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+ .declare muwSCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+ .declare mudCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+ .declare mubCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=1 SrcRegion=<32;32,1> DstRegion=<1> Type=ub
+
+
+ .declare fSCALING_0X_34X_TEMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+ .declare udSCALING_0X_34X_TEMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+ .declare ub4SCALING_0X_34X_TEMP Base=r9.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<1> Type=ub
+ .declare uwSCALING_0X_34X_TEMP Base=r9.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+ // Sampler ramp is used for Scaling 0X_0.34X
+ .declare fSAMPLER_RAMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> Type=f // 1 GRFs, 8 elements
+
+
+ //#define rMSGDSC_UV r23.0
+
+
+//End of _SCALING_
+
+
+ // Purpose: issue one sampler 8x8 (AVS) message that loads vertical block 2 of
+ // layer 0 into BUFFER_2, with all four channels (A, R, G, B) written back.
+ //
+ //NOTE: We need offsets for second half of LAYER 0 - even if we do not load it.
+ //Update the channel offset in the buffers for the lower 8x4 data for BUFFER_0.
+ // The immediate packs the 16-bit value 0x40 into both halves of the dword.
+ mov (1) r22.4<1>:ud 0x400040:ud
+
+
+ // Copy dword 3 of the r0 thread header into dword 3 of the message header (r16).
+ mov (1) r16.3<1>:ud r0.3<0;1,0>:ud
+
+
+ //AVS_PAYLOAD already has all the data loaded at this point
+ // Build the message descriptor in a0.0. Decoding 0x050EB000 with the
+ // "Sampler Message Descriptor" table above: message length 2, response
+ // length 16 GRFs, header present, SIMD mode 11, message type 01011 (sample_8x8).
+ // r23.5 supplies the remaining low bits (presumably sampler index and
+ // binding table index - confirm against the code that fills r23).
+ add (1) a0.0<1>:ud r23.5<0;1,0>:ud 0x50EB000:ud //msg desc
+
+ // M0.2 = 0: every write-channel mask bit is clear, so all channels are written back.
+ mov (1) r16.2<1>:ud 0x00000000:ud // Enable ARGB channels
+
+
+
+ // set the vertical block number
+ // (m1.1 in the AVS payload layout above; this file selects block 2)
+
+ mov (1) r25.1<1>:ud 2:ud
+
+ // r16 is the header and r17 the payload of the two-register message sent below.
+ mov (8) r17.0<1>:ud r25.0<8;8,1>:ud // Copy msg payload mirrors to MRFs
+
+ // Message starts at r16; the response lands at uwBUFFER_2 (declared at r96).
+ send (1) uwBUFFER_2(0)<1> r16 0x2 a0.0:ud
+ // Returns RGBA data in 16 GRFs in scrambled order
+
+ // No branch to this label is visible in this part of the file.
+SKIP_AVS_LOAD_L0_0_:
+ nop
+
+
--- /dev/null
+/*
+ * Copyright 2000-2011 Intel Corporation All Rights Reserved
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+// 44 // Total instruction count
+// 1 // Total kernel count
+
+
+
+// Module name: common.inc
+//
+// Common header file for all Video-Processing kernels
+//
+
+.default_execution_size (16)
+.default_register_type :ub
+
+.reg_count_total 128
+.reg_count_payload 7
+
+//========== Common constants ==========
+
+
+//========== Macros ==========
+
+
+//Fast Jump, For more details see "Set_Layer_N.asm"
+
+
+//========== Defines ====================
+
+//========== Static Parameters (Common To All) ==========
+//r1
+
+
+//r2
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+//Color Pipe (IECP) parameters
+
+
+//ByteCopy
+
+
+//r4
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+
+//========== Inline parameters (Common To All) ===========
+
+
+//============== Binding Index Table===========
+//Common between DNDI and DNUV
+
+
+//================= Common Message Descriptor =====
+// Message descriptor for thread spawning
+// Message Descriptors
+// = 000 0001 (min message len 1 ) 0,0000 (resp len 0 -add later)
+// 0000,0000,0000
+// 0001(Spawn a root thread),0001 (Root thread spawn thread)
+// = 0x02000011
+// Thread Spawner Message Descriptor
+
+
+// Message descriptor for atomic operation add
+// Message Descriptors
+// = 000 0110 (min message len 6 ) 0,0000 (resp len 0 -add later)
+// 1(header present)001,10(typed atomic operation)0(return enabled)0(slot group, low 8 bits),0111 (AOP_Add)
+// 0000,0000 (Binding table index, added later)
+// = 0x02000011
+
+// Atomic Operation Add Message Descriptor
+
+
+// Message descriptor for dataport media write
+ // Message Descriptors
+ // = 000 0001 (min message len 1 - add later) 00000 (resp len 0)
+ // 1 (header present 1) 0 1010 (media block write) 000000
+ // 00000000 (binding table index - set later)
+ // = 0x020A8000
+
+
+// Message Length defines
+
+
+// Response Length defines
+
+
+// Block Width and Height Size defines
+
+
+// Extended Message Descriptors
+
+
+// Common message descriptors:
+
+
+//===================== Math Function Control ===================================
+
+
+//============ Message Registers ===============
+ // buf4 starts from r28
+
+
+//#define mMSGHDR_EOT r43 // Dummy Message Register for EOT
+
+
+.declare mubMSGPAYLOAD Base=r30 ElementSize=1 SrcRegion=<16;16,1> Type=ub
+.declare muwMSGPAYLOAD Base=r30 ElementSize=2 SrcRegion=<16;16,1> Type=uw
+.declare mudMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=ud
+.declare mfMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=f
+
+//=================== End of thread instruction ===========================
+
+
+//=====================Pointers Used=====================================
+
+
+//=======================================================================
+
+
+//r9-r17
+// Define temp space for any usages
+
+
+// Common Buffers
+
+
+// temp space for rotation
+
+.declare fROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare udROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+.declare uwROBUF Base=r9.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+.declare ubROBUF Base=r9.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+.declare ub4ROBUF Base=r9.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+
+// End of common.inc
+
+
+// FileName: PA_AVS_Buf_3.asm
+// Author: Tatiya, Rupesh
+// Description: Loads 8x8 AVS/IEF packed (PA) data into Buffer 3
+
+
+
+// FileName : PL2_AVS_Buf.asm
+// Author : Tatiya, Rupesh
+// Description : Loads 8x8 AVS/IEF PL2 data into Buffer N
+
+
+
+// Module name: Scaling.inc
+
+
+
+
+// Description: Includes all definitions explicit to Fast Composite.
+
+
+
+
+// End of common.inc
+
+
+//========== GRF partition ==========
+ // r0 header : r0 (1 GRF)
+ // Static parameters : r1 - r6 (6 GRFS)
+ // Inline parameters : r7 - r8 (2 GRFs)
+ // MSGSRC : r27 (1 GRF)
+//===================================
+
+//Interface:
+//========== Static Parameters (Explicit To Fast Composite) ==========
+//r1
+//CSC Set 0
+
+
+.declare udCSC_CURBE Base=r1.0 ElementSize=4 Type=ud
+
+//Constant alpha
+
+
+//r2
+
+
+// Gen7 AVS WA
+
+
+// WiDi Definitions
+
+
+//Colorfill
+
+
+ // 0: 0-degree, 1: 90, 2: 180, 3: 270-degree, clockwise.
+
+.declare ubCOLOR_PIXEL_VAL Base=r2.20 ElementSize=1 SrcRegion=<0;1,0> DstRegion=<1> Type=ub
+
+//r3
+//Normalised Ratio of Horizontal step size with main video for all layers
+
+
+ //Normalised Ratio of Horizontal step size with main video for all layers becomes
+ //Normalised Horizontal step size for all layers in VP_Setup.asm
+
+
+//r4
+//Normalised Vertical step size for all layers
+
+
+//r5
+//Normalised Vertical Frame Origin for all layers
+
+
+//r6
+//Normalised Horizontal Frame Origin for all layers
+
+
+//========== Inline Parameters (Explicit To Fast Composite) ==========
+
+
+//Main video Step X
+
+
+//====================== Binding table (Explicit To Fast Composite)=========================================
+
+
+//Used by Interlaced Scaling Kernels
+
+
+//========== Sampler State Table Index (Explicit To Fast Composite)==========
+//Sampler Index for AVS/IEF messages
+
+
+//Sampler Index for SIMD16 sampler messages
+
+
+//=============================================================================
+
+.declare fBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_4 Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_5 Base=r46.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare udBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_4 Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_5 Base=r46.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+.declare uwBUFFER_0 Base=r64.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_1 Base=r80.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_2 Base=r96.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_3 Base=r112.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_4 Base=r28.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_5 Base=r46.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+.declare ubBUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_4 Base=r28.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_5 Base=r46.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+.declare ub4BUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_4 Base=r28.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_5 Base=r46.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+//Pointer to mask reg
+
+
+//r18
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+.declare udCSC_COEFF_0 Base=r18.0 ElementSize=4 Type=ud // 1 GRF
+
+//r19
+
+
+.declare udCSC_COEFF_1 Base=r19.0 ElementSize=4 Type=ud // 1 GRF
+
+
+//r20
+
+.declare uwALPHA_MASK_REG_TEMP Base=r20.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r21
+
+.declare uwALPHA_MASK_REG Base=r21.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r22
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+//Keep fORIGIN_X_NLAS, fY_OFFSET_2ND_BLOCK, fSTEP_X_NLAS, pMSGDSC_COPY, ubCONST_ALPHA_COPY as
+//sub registers of same GRF to enable using NODDCLR NODDCHK. -rT
+
+//r23
+
+
+//Lumakey
+
+
+//r24
+
+
+//r25
+
+
+//r26
+
+
+//defines to generate LABELS during compile time.
+
+
+ // Message Header
+ // m0.7 31:0 Debug
+ // m0.6 31:0 Debug
+ // m0.5 31:0 Ignored
+ // m0.4 31:0 Ignored
+ // m0.3 31:0 Ignored
+ // m0.2 31:16 Ignored
+ // 15 Alpha Write Channel Mask enable=0, disable=1
+ // 14 Blue Write Channel Mask (U)
+ // 13 Green Write Channel Mask (Y)
+ // 12 Red Write Channel Mask (V)
+ // 11:0 Ignored
+ // m0.1 Ignored
+ // m0.0 Ignored
+
+
+ // AVS payload
+ // m1.7 Group ID Number
+ // m1.6 U 2nd Derivative ---> NLAS dx
+ // m1.5 Delta V ---> Step Y
+ // m1.4 Delta U ---> Step X
+ // m1.3 Pixel 0 V Address ---> ORIY (Y0)
+ // m1.2 Pixel 0 U Address ---> ORIX (X0)
+ // m1.1 Vertical Block Number
+ // m1.0 Reserved
+
+ // Sampler Message Descriptor
+ // 31:29 Reserved 000
+ // 28:25 Message length 0010
+ // 24:20 Response length xxxxx ---> 4GRFs for each enabled channel (AVS), 2GRFs for each enabled channel (sample unorm)
+ // 19 Header Present 1
+ // 18:17 SIMD Mode 11 ---> SIMD32/64
+ // 16:12 Message Type xxxxx ---> 01011 sample_8x8, 01100 (sample_unorm), 01010 (sample_unorm+killpix)
+ // 11:8 Sampler Index xxxx
+ // 7:0 Binding Table Index xxxxxxxx
+
+
+ // Msg Header M0.2
+ // 15:15 Alpha Write Channel Mask, 0: written back, 1: not written back
+ // 14:14 Blue Write Channel Mask
+ // 13:13 Green Write Channel Mask
+ // 12:12 Red Write Channel Mask
+
+
+//By design, Buffer 0,1,2,3 always have Layer 0 and Buffer 4,5 always have L1-L7
+
+
+//used to generate LABELS at compile time.
+
+
+ // 18:17 SIMD Mode 10 ---> SIMD16
+ // 16:12 Message Type xxxxx ---> 00000 (SIMD16)
+
+
+//r10-17 - 8 GRFs to load SIMD16 data (upto 4 channels)
+//r18-19 - 2 GRFs to store sampler ramp.
+
+ .declare mfSCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+ .declare muwSCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+ .declare mudCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+ .declare mubCALING_0X_34X_PAYLOAD Base=r14.0 ElementSize=1 SrcRegion=<32;32,1> DstRegion=<1> Type=ub
+
+
+ .declare fSCALING_0X_34X_TEMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+ .declare udSCALING_0X_34X_TEMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+ .declare ub4SCALING_0X_34X_TEMP Base=r9.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<1> Type=ub
+ .declare uwSCALING_0X_34X_TEMP Base=r9.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+ // Sampler ramp is used for Scaling 0X_0.34X
+ .declare fSAMPLER_RAMP Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> Type=f // 1 GRFs, 8 elements
+
+
+ //#define rMSGDSC_UV r23.0
+
+
+//End of _SCALING_
+
+
+ // Purpose: issue one sampler 8x8 (AVS) message that loads vertical block 3 of
+ // layer 0 into BUFFER_3, with all four channels (A, R, G, B) written back.
+ //
+ //NOTE: We need offsets for second half of LAYER 0 - even if we do not load it.
+ //Update the channel offset in the buffers for the lower 8x4 data for BUFFER_0.
+ // The immediate packs the 16-bit value 0x40 into both halves of the dword.
+ mov (1) r22.4<1>:ud 0x400040:ud
+
+
+ // Copy dword 3 of the r0 thread header into dword 3 of the message header (r16).
+ mov (1) r16.3<1>:ud r0.3<0;1,0>:ud
+
+
+ //AVS_PAYLOAD already has all the data loaded at this point
+ // Build the message descriptor in a0.0. Decoding 0x050EB000 with the
+ // "Sampler Message Descriptor" table above: message length 2, response
+ // length 16 GRFs, header present, SIMD mode 11, message type 01011 (sample_8x8).
+ // r23.5 supplies the remaining low bits (presumably sampler index and
+ // binding table index - confirm against the code that fills r23).
+ add (1) a0.0<1>:ud r23.5<0;1,0>:ud 0x50EB000:ud //msg desc
+
+ // M0.2 = 0: every write-channel mask bit is clear, so all channels are written back.
+ mov (1) r16.2<1>:ud 0x00000000:ud // Enable ARGB channels
+
+
+
+ // set the vertical block number
+ // (m1.1 in the AVS payload layout above; this file selects block 3)
+
+ mov (1) r25.1<1>:ud 3:ud
+
+ // r16 is the header and r17 the payload of the two-register message sent below.
+ mov (8) r17.0<1>:ud r25.0<8;8,1>:ud // Copy msg payload mirrors to MRFs
+
+ // Message starts at r16; the response lands at uwBUFFER_3 (declared at r112),
+ // so the 16 returned GRFs occupy r112-r127, the top of the 128-register file.
+ send (1) uwBUFFER_3(0)<1> r16 0x2 a0.0:ud
+ // Returns RGBA data in 16 GRFs in scrambled order
+
+ // No branch to this label is visible in this file.
+SKIP_AVS_LOAD_L0_0_:
+ nop
+
+
--- /dev/null
+/*
+ * Copyright 2000-2013 Intel Corporation All Rights Reserved
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ * Authors:
+ * Zhao Yakui <yakui.zhao@intel.com>
+ */
+
+
+
+// Module name: common.inc
+//
+// Common header file for all Video-Processing kernels
+//
+
+.default_execution_size (16)
+.default_register_type :ub
+
+.reg_count_total 128
+.reg_count_payload 7
+
+//========== Common constants ==========
+
+
+//========== Macros ==========
+
+
+//Fast Jump, For more details see "Set_Layer_N.asm"
+
+
+//========== Defines ====================
+
+//========== Static Parameters (Common To All) ==========
+//r1
+
+
+//r2
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+//Color Pipe (IECP) parameters
+
+
+//ByteCopy
+
+
+//r4
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+
+//========== Inline parameters (Common To All) ===========
+
+
+//============== Binding Index Table===========
+//Common between DNDI and DNUV
+
+
+//================= Common Message Descriptor =====
+// Message descriptor for thread spawning
+// Message Descriptors
+// = 000 0001 (min message len 1 ) 0,0000 (resp len 0 -add later)
+// 0000,0000,0000
+// 0001(Spawn a root thread),0001 (Root thread spawn thread)
+// = 0x02000011
+// Thread Spawner Message Descriptor
+
+
+// Message descriptor for atomic operation add
+// Message Descriptors
+// = 000 0110 (min message len 6 ) 0,0000 (resp len 0 -add later)
+// 1(header present)001,10(typed atomic operation)0(return enabled)0(slot group, low 8 bits),0111 (AOP_Add)
+// 0000,0000 (Binding table index, added later)
+// = 0x02000011
+
+// Atomic Operation Add Message Descriptor
+
+
+// Message descriptor for dataport media write
+ // Message Descriptors
+ // = 000 0001 (min message len 1 - add later) 00000 (resp len 0)
+ // 1 (header present 1) 0 1010 (media block write) 000000
+ // 00000000 (binding table index - set later)
+ // = 0x020A8000
+
+
+// Message Length defines
+
+
+// Response Length defines
+
+
+// Block Width and Height Size defines
+
+
+// Extended Message Descriptors
+
+
+// Common message descriptors:
+
+
+//===================== Math Function Control ===================================
+
+
+//============ Message Registers ===============
+ // buf4 starts from r28
+
+
+//#define mMSGHDR_EOT r43 // Dummy Message Register for EOT
+
+
+.declare mubMSGPAYLOAD Base=r30 ElementSize=1 SrcRegion=<16;16,1> Type=ub
+.declare muwMSGPAYLOAD Base=r30 ElementSize=2 SrcRegion=<16;16,1> Type=uw
+.declare mudMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=ud
+.declare mfMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=f
+
+//=================== End of thread instruction ===========================
+
+
+//=====================Pointers Used=====================================
+
+
+//=======================================================================
+
+
+//r9-r17
+// Define temp space for any usages
+
+
+// Common Buffers
+
+
+// temp space for rotation
+
+.declare fROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare udROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+.declare uwROBUF Base=r9.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+.declare ubROBUF Base=r9.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+.declare ub4ROBUF Base=r9.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+
+// End of common.inc
+
+
+// Module name: RGB_to_YUV.asm
+//
+// Convert RGB to YUV, handle it by 16x4 block
+//
+
+
+// Description: Includes all definitions explicit to Fast Composite.
+
+
+//========== GRF partition ==========
+ // r0 header : r0 (1 GRF)
+ // Static parameters : r1 - r6 (6 GRFS)
+ // Inline parameters : r7 - r8 (2 GRFs)
+ // MSGSRC : r27 (1 GRF)
+//===================================
+
+//Interface:
+//========== Static Parameters (Explicit To Fast Composite) ==========
+//r1
+//CSC Set 0
+
+
+.declare udCSC_CURBE Base=r1.0 ElementSize=4 Type=ud
+
+//Constant alpha
+
+
+//r2
+
+
+// Gen7 AVS WA
+
+
+// WiDi Definitions
+
+
+//Colorfill
+
+
+ // 0: 0-degree, 1: 90, 2: 180, 3: 270-degree, clockwise.
+
+.declare ubCOLOR_PIXEL_VAL Base=r2.20 ElementSize=1 SrcRegion=<0;1,0> DstRegion=<1> Type=ub
+
+//r3
+//Normalised Ratio of Horizontal step size with main video for all layers
+
+
+ //Normalised Ratio of Horizontal step size with main video for all layers becomes
+ //Normalised Horizontal step size for all layers in VP_Setup.asm
+
+
+//r4
+//Normalised Vertical step size for all layers
+
+
+//r5
+//Normalised Vertical Frame Origin for all layers
+
+
+//r6
+//Normalised Horizontal Frame Origin for all layers
+
+
+//========== Inline Parameters (Explicit To Fast Composite) ==========
+
+
+//Main video Step X
+
+
+//====================== Binding table (Explicit To Fast Composite)=========================================
+
+
+//Used by Interlaced Scaling Kernels
+
+
+//========== Sampler State Table Index (Explicit To Fast Composite)==========
+//Sampler Index for AVS/IEF messages
+
+
+//Sampler Index for SIMD16 sampler messages
+
+
+//=============================================================================
+
+.declare fBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare bBUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare bBUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare bBUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare bBUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+.declare uwBUFFER_0 Base=r64.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_1 Base=r80.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_2 Base=r96.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_3 Base=r112.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+//Pointer to mask reg
+
+.declare udBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+//r18
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+.declare udCSC_COEFF_0 Base=r18.0 ElementSize=4 Type=ud // 1 GRF
+
+//r19
+
+
+.declare udCSC_COEFF_1 Base=r19.0 ElementSize=4 Type=ud // 1 GRF
+
+
+//r20
+
+.declare uwALPHA_MASK_REG_TEMP Base=r20.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r21
+
+.declare uwALPHA_MASK_REG Base=r21.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r22
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+//Keep fORIGIN_X_NLAS, fY_OFFSET_2ND_BLOCK, fSTEP_X_NLAS, pMSGDSC_COPY, ubCONST_ALPHA_COPY as
+//sub registers of same GRF to enable using NODDCLR NODDCHK. -rT
+
+//r23
+
+
+//Lumakey
+
+
+//r24
+
+
+//r25
+
+
+//r26
+
+
+//defines to generate LABELS during compile time.
+
+
+//Msg payload buffers; up to 4 full-size messages can be written
+
+//The MSGPayLoad registers are not needed here, so they are temporarily used for the RGB->YUV conversion
+
+// Float staging for the input colour channels. The conversion code addresses
+// rows (0,0) and (1,0) of each, i.e. two consecutive GRFs holding 16 floats.
+.declare fBUFFER_R Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> Type=f
+.declare fBUFFER_G Base=r30.0 ElementSize=4 SrcRegion=<8;8,1> Type=f
+.declare fBUFFER_B Base=r32.0 ElementSize=4 SrcRegion=<8;8,1> Type=f
+
+// Float results of the colour-space conversion (Y, U, V), same two-GRF layout.
+.declare fBUFFER_Y Base=r36.0 ElementSize=4 SrcRegion=<8;8,1> Type=f
+.declare fBUFFER_U Base=r38.0 ElementSize=4 SrcRegion=<8;8,1> Type=f
+.declare fBUFFER_V Base=r40.0 ElementSize=4 SrcRegion=<8;8,1> Type=f
+
+// Integer scratch that receives the float results converted to 16-bit words.
+.declare wTempY Base=r42.0 ElementSize=2 Type=w
+.declare wTempU Base=r44.0 ElementSize=2 Type=w
+.declare wTempV Base=r46.0 ElementSize=2 Type=w
+
+// Byte views of the same registers as wTempY/U/V (identical bases r42/r44/r46),
+// used to pick individual bytes out of the converted words.
+.declare ubTempY Base=r42.0 ElementSize=1 Type=ub
+.declare ubTempU Base=r44.0 ElementSize=1 Type=ub
+.declare ubTempV Base=r46.0 ElementSize=1 Type=ub
+
+ // the r17 register (nTEMP0) is originally defined from "Common.inc"
+ // instead of re-defining a nTEMP0 here, we use "SAVE_RGB" suffix for its naming
+ // NOTE(review): the alias declared below is named uwTemp0 and carries no such
+ // suffix, so the sentence above looks stale. It is used as the scratch word
+ // for the a0.0/a0.1 pointer swap.
+
+ .declare uwTemp0 Base=r17.0 ElementSize=2 Type=uw
+
+
+//_SAVE_INC_
+ // ITU-R conversion, Now we are using ITU-R conversion
+ // Y = 0.299R + 0.587G + 0.114B
+ // U = -0.169R - 0.331G + 0.499B + 128
+ // V = 0.499R - 0.418G - 0.0813B+ 128
+
+ // At the save module we have all 8 address sub-registers available.
+ // So we will use PING-PONG type of scheme to save the data using
+ // pointers pBUF_CHNL_TOP_8x4 and pBUF_CHNL_BOT_8x4. This will help
+ // reduce dependency. - rT
+
+ //wBUFF_CHNL_PTR points to either buffer 0 or buffer 4.
+ //Add appropriate offsets to get pointers for all buffers (1,2,3 or 5).
+ //Offsets are zero for buffer 0 and buffer 4.
+ //It always uses the YUVA layout.
+//for BUFFER_0
+ // Load the four channel pointers held in r22.0-r22.3 into the address
+ // registers twice: a0.0-a0.3 are used to read the RGB input and a0.4-a0.7
+ // to write the YUV output.
+ mov (4) a0.0<1>:uw r22.0<4;4,1>:uw
+ mov (4) a0.4<1>:uw r22.0<4;4,1>:uw
+ // YUV uses the a0.5,a0.6 and a0.4 as the indirect-register
+ // Y = a0.5, U=a0.6, V=a0.4
+ // if channel swap?
+ // This means that it should be BGRX(B is the LSB) or RGBX
+ // 1 means that it is BGRX.
+ // Test bit 0 of the word at r2.0; f0.0 is set when the bit is non-zero.
+ and.nz.f0.0 null<1>:w r2.0<0;1,0>:uw 0x01:w
+ // pointer swap
+ // When f0.0 is set, exchange a0.0 and a0.1 through uwTemp0. The conversion
+ // code reads B through a0.0 and R through a0.1, so this swaps which input
+ // channel is treated as R and which as B. The output copies in a0.4/a0.5
+ // are not touched.
+ (f0.0) mov (1) uwTemp0<1> a0.0:uw
+ (f0.0) mov (1) a0.0:uw a0.1:uw
+ (f0.0) mov (1) a0.1:uw uwTemp0<0;1,0>
+
+//the first line in the block 0
+ // Load 16 pixels of each colour channel and convert them from bytes to floats.
+ // Each move reads 8 bytes with a stride of 2, starting at an odd byte offset
+ // (1, then 17) from the channel pointer, i.e. the odd byte of every 16-bit slot.
+ // R is read through a0.1, G through a0.2 and B through a0.0.
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 1]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 17]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 1]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 17]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 1]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 17]<16;8,2>:ub
+
+ // Y = 0.299*R + 0.587*G + 0.114*B, accumulated in acc0; the last mac writes
+ // the sum to fBUFFER_Y.
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ // U = 128 - 0.169*R - 0.331*G + 0.499*B; acc0 is preloaded with the 128 bias.
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ // V = 128 + 0.499*R - 0.418*G - 0.0813*B; acc0 is preloaded with the 128 bias.
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ // Convert the float results to 16-bit integers. The destination stride of
+ // two words gives every result its own 4-byte slot in wTempY/U/V.
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ // Clear the 16 output words of this line (byte offset 0 from each output
+ // pointer), then store the first byte of every 4-byte slot of the converted
+ // values into the odd bytes of the output (offset 1, stride 2) - the same
+ // byte positions the inputs were read from.
+ // Y is written through a0.5, U through a0.6 and V through a0.4.
+ mov (16) r[a0.5, 0]<1>:uw 0:uw
+ mov (16) r[a0.6, 0]<1>:uw 0:uw
+ mov (16) r[a0.4, 0]<1>:uw 0:uw
+ mov (16) r[a0.5,1]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,1]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,1]<2>:ub ubTempV(0, 0)<32;8,4>
+
+
+//the second line in the block 0
+ // Same sequence as the first line, shifted by 32 bytes: inputs are read from
+ // byte offsets 33 and 49, outputs are written at offsets 32 and 33.
+ // R is read through a0.1, G through a0.2 and B through a0.0.
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 33]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 49]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 33]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 49]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 33]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 49]<16;8,2>:ub
+
+ // Y = 0.299*R + 0.587*G + 0.114*B, accumulated in acc0; the last mac writes
+ // the sum to fBUFFER_Y.
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ // U = 128 - 0.169*R - 0.331*G + 0.499*B; acc0 is preloaded with the 128 bias.
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ // V = 128 + 0.499*R - 0.418*G - 0.0813*B; acc0 is preloaded with the 128 bias.
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ // Convert the float results to 16-bit integers. The destination stride of
+ // two words gives every result its own 4-byte slot in wTempY/U/V.
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ // Clear the 16 output words of this line (byte offset 32 from each output
+ // pointer), then store the first byte of every 4-byte slot of the converted
+ // values into the odd bytes of the output (offset 33, stride 2).
+ // Y is written through a0.5, U through a0.6 and V through a0.4.
+ mov (16) r[a0.5, 32]<1>:uw 0:uw
+ mov (16) r[a0.6, 32]<1>:uw 0:uw
+ mov (16) r[a0.4, 32]<1>:uw 0:uw
+ mov (16) r[a0.5,33]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,33]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,33]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//the third line in the block 0
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 65]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 81]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 65]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 81]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 65]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 81]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 64]<1>:uw 0:uw
+ mov (16) r[a0.6, 64]<1>:uw 0:uw
+ mov (16) r[a0.4, 64]<1>:uw 0:uw
+ mov (16) r[a0.5,65]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,65]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,65]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//the fourth line in the block 0
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 97]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 113]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 97]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 113]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 97]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 113]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 96]<1>:uw 0:uw
+ mov (16) r[a0.6, 96]<1>:uw 0:uw
+ mov (16) r[a0.4, 96]<1>:uw 0:uw
+ mov (16) r[a0.5,97]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,97]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,97]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//for Buffer_1
+
+ add (8) a0.0<1>:uw a0.0<8;8,1>:uw 512:uw
+//the first line in the block 1
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 1]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 17]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 1]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 17]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 1]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 17]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 0]<1>:uw 0:uw
+ mov (16) r[a0.6, 0]<1>:uw 0:uw
+ mov (16) r[a0.4, 0]<1>:uw 0:uw
+ mov (16) r[a0.5,1]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,1]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,1]<2>:ub ubTempV(0, 0)<32;8,4>
+
+
+//the second line in the block 1
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 33]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 49]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 33]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 49]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 33]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 49]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 32]<1>:uw 0:uw
+ mov (16) r[a0.6, 32]<1>:uw 0:uw
+ mov (16) r[a0.4, 32]<1>:uw 0:uw
+ mov (16) r[a0.5,33]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,33]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,33]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//the third line in the block 1
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 65]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 81]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 65]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 81]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 65]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 81]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 64]<1>:uw 0:uw
+ mov (16) r[a0.6, 64]<1>:uw 0:uw
+ mov (16) r[a0.4, 64]<1>:uw 0:uw
+ mov (16) r[a0.5,65]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,65]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,65]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//the fourth line in the block 1
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 97]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 113]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 97]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 113]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 97]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 113]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 96]<1>:uw 0:uw
+ mov (16) r[a0.6, 96]<1>:uw 0:uw
+ mov (16) r[a0.4, 96]<1>:uw 0:uw
+ mov (16) r[a0.5,97]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,97]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,97]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//for Buffer_2
+ add (8) a0.0<1>:uw a0.0<8;8,1>:uw 512:uw
+//the first line in the block 2
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 1]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 17]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 1]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 17]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 1]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 17]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 0]<1>:uw 0:uw
+ mov (16) r[a0.6, 0]<1>:uw 0:uw
+ mov (16) r[a0.4, 0]<1>:uw 0:uw
+ mov (16) r[a0.5,1]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,1]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,1]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//the second line in the block 2
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 33]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 49]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 33]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 49]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 33]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 49]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 32]<1>:uw 0:uw
+ mov (16) r[a0.6, 32]<1>:uw 0:uw
+ mov (16) r[a0.4, 32]<1>:uw 0:uw
+ mov (16) r[a0.5,33]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,33]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,33]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//the third line in the block 2
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 65]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 81]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 65]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 81]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 65]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 81]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 64]<1>:uw 0:uw
+ mov (16) r[a0.6, 64]<1>:uw 0:uw
+ mov (16) r[a0.4, 64]<1>:uw 0:uw
+ mov (16) r[a0.5,65]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,65]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,65]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//the fourth line in the block 2
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 97]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 113]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 97]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 113]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 97]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 113]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 96]<1>:uw 0:uw
+ mov (16) r[a0.6, 96]<1>:uw 0:uw
+ mov (16) r[a0.4, 96]<1>:uw 0:uw
+ mov (16) r[a0.5,97]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,97]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,97]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//for Buffer_3
+ add (8) a0.0<1>:uw a0.0<8;8,1>:uw 512:uw
+//the first line in the block 3
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 1]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 17]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 1]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 17]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 1]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 17]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 0]<1>:uw 0:uw
+ mov (16) r[a0.6, 0]<1>:uw 0:uw
+ mov (16) r[a0.4, 0]<1>:uw 0:uw
+ mov (16) r[a0.5,1]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,1]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,1]<2>:ub ubTempV(0, 0)<32;8,4>
+
+
+//the second line in the block 3
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 33]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 49]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 33]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 49]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 33]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 49]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 32]<1>:uw 0:uw
+ mov (16) r[a0.6, 32]<1>:uw 0:uw
+ mov (16) r[a0.4, 32]<1>:uw 0:uw
+ mov (16) r[a0.5,33]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,33]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,33]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//the third line in the block 3
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 65]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 81]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 65]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 81]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 65]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 81]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 64]<1>:uw 0:uw
+ mov (16) r[a0.6, 64]<1>:uw 0:uw
+ mov (16) r[a0.4, 64]<1>:uw 0:uw
+ mov (16) r[a0.5,65]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,65]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,65]<2>:ub ubTempV(0, 0)<32;8,4>
+
+//the fourth line in the block 3
+ mov (8) fBUFFER_R(0, 0)<1> r[a0.1, 97]<16;8,2>:ub
+ mov (8) fBUFFER_R(1, 0)<1> r[a0.1, 113]<16;8,2>:ub
+ mov (8) fBUFFER_G(0, 0)<1> r[a0.2, 97]<16;8,2>:ub
+ mov (8) fBUFFER_G(1, 0)<1> r[a0.2, 113]<16;8,2>:ub
+ mov (8) fBUFFER_B(0, 0)<1> r[a0.0, 97]<16;8,2>:ub
+ mov (8) fBUFFER_B(1, 0)<1> r[a0.0, 113]<16;8,2>:ub
+
+ mul (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.299f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> 0.587f
+ mac (16) fBUFFER_Y(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.114f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> -0.169f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.331f
+ mac (16) fBUFFER_U(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> 0.499f
+
+ mov (16) acc0.0<1>:f 128.0f
+ mac (16) acc0.0<1>:f fBUFFER_R(0, 0)<8;8,1> 0.499f
+ mac (16) acc0.0<1>:f fBUFFER_G(0, 0)<8;8,1> -0.418f
+ mac (16) fBUFFER_V(0, 0)<1> fBUFFER_B(0, 0)<8;8,1> -0.0813f
+
+ mov (16) wTempY(0,0)<2> fBUFFER_Y(0, 0)<8;8,1>
+ mov (16) wTempU(0,0)<2> fBUFFER_U(0, 0)<8;8,1>
+ mov (16) wTempV(0,0)<2> fBUFFER_V(0, 0)<8;8,1>
+
+ mov (16) r[a0.5, 96]<1>:uw 0:uw
+ mov (16) r[a0.6, 96]<1>:uw 0:uw
+ mov (16) r[a0.4, 96]<1>:uw 0:uw
+ mov (16) r[a0.5,97]<2>:ub ubTempY(0, 0)<32;8,4>
+ mov (16) r[a0.6,97]<2>:ub ubTempU(0, 0)<32;8,4>
+ mov (16) r[a0.4,97]<2>:ub ubTempV(0, 0)<32;8,4>
+
--- /dev/null
+/*
+ * Copyright 2000-2013 Intel Corporation All Rights Reserved
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ *
+ * Authors: Zhao Yakui <yakui.zhao@intel.com>
+ */
+// 7 // Total instruction count
+// 1 // Total kernel count
+
+
+
+// Module name: common.inc
+//
+// Common header file for all Video-Processing kernels
+//
+
+.default_execution_size (16)
+.default_register_type :ub
+
+.reg_count_total 128
+.reg_count_payload 7
+
+//========== Common constants ==========
+
+
+//========== Macros ==========
+
+
+//Fast Jump, For more details see "Set_Layer_N.asm"
+
+
+//========== Defines ====================
+
+//========== Static Parameters (Common To All) ==========
+//r1
+
+
+//r2
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+//Color Pipe (IECP) parameters
+
+
+//ByteCopy
+
+
+//r4
+
+ // e.g. byte0 byte1 byte2
+ // YUYV 0 1 3
+ // YVYU 0 3 1
+
+
+//========== Inline parameters (Common To All) ===========
+
+
+//============== Binding Index Table===========
+//Common between DNDI and DNUV
+
+
+//================= Common Message Descriptor =====
+// Message descriptor for thread spawning
+// Message Descriptors
+// = 000 0001 (min message len 1 ) 0,0000 (resp len 0 -add later)
+// 0000,0000,0000
+// 0001(Spawn a root thread),0001 (Root thread spawn thread)
+// = 0x02000011
+// Thread Spawner Message Descriptor
+
+
+// Message descriptor for atomic operation add
+// Message Descriptors
+// = 000 0110 (min message len 6 ) 0,0000 (resp len 0 -add later)
+// 1(header present)001,10(typed atomic operation)0(return enabled)0(slot group, low 8 bits),0111 (AOP_Add)
+// 0000,0000 (Binding table index, added later)
+// = 0x0C098700
+
+// Atomic Operation Add Message Descriptor
+
+
+// Message descriptor for dataport media write
+ // Message Descriptors
+ // = 000 0001 (min message len 1 - add later) 00000 (resp len 0)
+ // 1 (header present 1) 0 1010 (media block write) 000000
+ // 00000000 (binding table index - set later)
+ // = 0x020A8000
+
+
+// Message Length defines
+
+
+// Response Length defines
+
+
+// Block Width and Height Size defines
+
+
+// Extended Message Descriptors
+
+
+// Common message descriptors:
+
+
+//===================== Math Function Control ===================================
+
+
+//============ Message Registers ===============
+ // buf4 starts from r28
+
+
+//#define mMSGHDR_EOT r43 // Dummy Message Register for EOT
+
+
+// Message payload aliases: all four names share Base=r30 and differ only in
+// element type/size (ub, uw, ud, f) and the default source region.
+.declare mubMSGPAYLOAD Base=r30 ElementSize=1 SrcRegion=<16;16,1> Type=ub
+.declare muwMSGPAYLOAD Base=r30 ElementSize=2 SrcRegion=<16;16,1> Type=uw
+.declare mudMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=ud
+.declare mfMSGPAYLOAD Base=r30 ElementSize=4 SrcRegion=<8;8,1> Type=f
+
+//=================== End of thread instruction ===========================
+
+
+//=====================Pointers Used=====================================
+
+
+//=======================================================================
+
+
+//r9-r17
+// Define temp space for any usages
+
+
+// Common Buffers
+
+
+// temp space for rotation
+
+// Five aliases over the same storage starting at r9.0. They differ only in
+// element type/size and default regions: float, dword, word, byte, and a byte
+// view that steps 4 bytes per element (ub4ROBUF).
+.declare fROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+.declare udROBUF Base=r9.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+.declare uwROBUF Base=r9.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+.declare ubROBUF Base=r9.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+// Byte view with horizontal stride 4 on both source and destination.
+.declare ub4ROBUF Base=r9.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+
+// End of common.inc
+
+
+//Module Name: Set_AVS_Buf_0123_BGRA.asm
+
+
+
+//Module Name: Set_Buf_0123_BGRA
+
+
+
+
+// Description: Includes all definitions explicit to Fast Composite.
+
+
+
+
+// End of common.inc
+
+
+//========== GRF partition ==========
+ // r0 header : r0 (1 GRF)
+ // Static parameters : r1 - r6 (6 GRFS)
+ // Inline parameters : r7 - r8 (2 GRFs)
+ // MSGSRC : r27 (1 GRF)
+//===================================
+
+//Interface:
+//========== Static Parameters (Explicit To Fast Composite) ==========
+//r1
+//CSC Set 0
+
+
+.declare udCSC_CURBE Base=r1.0 ElementSize=4 Type=ud
+
+//Constant alpha
+
+
+//r2
+
+
+// Gen7 AVS WA
+
+
+// WiDi Definitions
+
+
+//Colorfill
+
+
+ // 0: 0-degree, 1: 90, 2: 180, 3: 270-degree, clockwise.
+
+.declare ubCOLOR_PIXEL_VAL Base=r2.20 ElementSize=1 SrcRegion=<0;1,0> DstRegion=<1> Type=ub
+
+//r3
+//Normalised Ratio of Horizontal step size with main video for all layers
+
+
+ //Normalised Ratio of Horizontal step size with main video for all layers becomes
+ //Normalised Horizontal step size for all layers in VP_Setup.asm
+
+
+//r4
+//Normalised Vertical step size for all layers
+
+
+//r5
+//Normalised Vertical Frame Origin for all layers
+
+
+//r6
+//Normalised Horizontal Frame Origin for all layers
+
+
+//========== Inline Parameters (Explicit To Fast Composite) ==========
+
+
+//Main video Step X
+
+
+//====================== Binding table (Explicit To Fast Composite)=========================================
+
+
+//Used by Interlaced Scaling Kernels
+
+
+//========== Sampler State Table Index (Explicit To Fast Composite)==========
+//Sampler Index for AVS/IEF messages
+
+
+//Sampler Index for SIMD16 sampler messages
+
+
+//=============================================================================
+
+// Working buffers BUFFER_0..BUFFER_5. Each buffer is declared five times over
+// the same base register so it can be addressed with different element types:
+//   BUFFER_0 = r64, BUFFER_1 = r80, BUFFER_2 = r96, BUFFER_3 = r112,
+//   BUFFER_4 = r28, BUFFER_5 = r46.
+
+// Float (4-byte) view.
+.declare fBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_4 Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+.declare fBUFFER_5 Base=r46.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=f
+
+// Unsigned dword (4-byte) view.
+.declare udBUFFER_0 Base=r64.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_1 Base=r80.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_2 Base=r96.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_3 Base=r112.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_4 Base=r28.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+.declare udBUFFER_5 Base=r46.0 ElementSize=4 SrcRegion=<8;8,1> DstRegion=<1> Type=ud
+
+// Unsigned word (2-byte) view.
+.declare uwBUFFER_0 Base=r64.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_1 Base=r80.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_2 Base=r96.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_3 Base=r112.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_4 Base=r28.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+.declare uwBUFFER_5 Base=r46.0 ElementSize=2 SrcRegion=<16;16,1> DstRegion=<1> Type=uw
+
+// Unsigned byte view, contiguous elements.
+.declare ubBUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_4 Base=r28.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+.declare ubBUFFER_5 Base=r46.0 ElementSize=1 SrcRegion=<16;16,1> DstRegion=<1> Type=ub
+
+// Unsigned byte view that steps 4 bytes per element (source and destination stride 4).
+.declare ub4BUFFER_0 Base=r64.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_1 Base=r80.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_2 Base=r96.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_3 Base=r112.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_4 Base=r28.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+.declare ub4BUFFER_5 Base=r46.0 ElementSize=1 SrcRegion=<32;8,4> DstRegion=<4> Type=ub
+
+//Pointer to mask reg
+
+
+//r18
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+// Dword view starting at r18.0 (one full GRF, per the trailing note).
+.declare udCSC_COEFF_0 Base=r18.0 ElementSize=4 Type=ud // 1 GRF
+
+//r19
+
+
+// Dword view starting at r19.0 (one full GRF).
+.declare udCSC_COEFF_1 Base=r19.0 ElementSize=4 Type=ud // 1 GRF
+
+
+//r20
+
+// Word view starting at r20.0 (one full GRF).
+.declare uwALPHA_MASK_REG_TEMP Base=r20.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r21
+
+// Word view starting at r21.0 (one full GRF).
+.declare uwALPHA_MASK_REG Base=r21.0 ElementSize=2 SrcRegion=<16;16,1> Type=uw // 1 GRF
+
+//r22
+
+
+//Always keep Channel Pointers and Offsets in same GRF, so that we can use
+// NODDCLR, NODDCHK flags. -rT
+
+
+//Keep fORIGIN_X_NLAS, fY_OFFSET_2ND_BLOCK, fSTEP_X_NLAS, pMSGDSC_COPY, ubCONST_ALPHA_COPY as
+//sub registers of same GRF to enable using NODDCLR NODDCHK. -rT
+
+//r23
+
+
+//Lumakey
+
+
+//r24
+
+
+//r25
+
+
+//r26
+
+
+//defines to generate LABELS during compile time.
+
+
+ //AVS LAYOUT:(UUYYVVAA)
+ //AVS RGBX LAYOUT (RRGGBBAA)
+ //Assign buffer channel order for Buffer 0123 in the order AUYV a0.3>A, a0.2>U, a0.1>Y, a0.0>V
+ // V = 8, Y= 0, U = 4, A = 12.
+ // And a0.x is used as indirect-register for RGBX. R=a0.1, G=a0.2, B=a0.0
+ // B = 8, R= 0, G = 4, A = 12
+ // How the three instructions below produce those offsets:
+ //   0x6EA2:v is a packed vector of signed 4-bit elements, lowest nibble first: {2, -6, -2, 6}.
+ //   Adding 70 gives register numbers {72, 64, 68, 76}, i.e. {8, 0, 4, 12} relative to r64 (base of BUFFER_0).
+ //   Shifting left by 5 multiplies each register number by 32, turning it into a byte address.
+ // The four resulting words are written to r22.0-r22.3.
+ // NOTE(review): presumably these are loaded into a0.0-a0.3 by a later stage - confirm.
+ mov (4) acc0.0<1>:w 0x6EA2:v
+ add (4) acc0.0<1>:w acc0<4;4,1>:w 70:uw
+ shl (4) r22.0<1>:w acc0<4;4,1>:w 5:uw
+
+ //OPT: wAVS_SU_SHUFFLE_PTR_0 and udAVS_SU_SHUFFLE_OFF_0 are sub-regs of same GRF. -rT
+
+ //SU LAYOUT:(VYUAVYUA)
+ //V = 4, Y = 2, U = 0, A = 6
+ //B = 4, G = 2, R = 0, A = 6
+ // Same pattern as above: 0x6204:v unpacks to {4, 0, 2, 6}; adding 64 gives {68, 64, 66, 70},
+ // and the shift by 5 stores the corresponding byte addresses in r18.0-r18.3.
+ // NOTE(review): in element order the values are 4, 0, 2, 6 - confirm how they map onto the channel list above.
+ mov (4) acc0.0<1>:w 0x6204:v
+ add (4) acc0.0<1>:w acc0<4;4,1>:w 64:uw
+ shl (4) r18.0<1>:w acc0<4;4,1>:w 5:uw { NoDDClr } //Convert to BYTE address.
+
+ //OFFSET:
+ // Writes 0x01000100 (two 16-bit halves of 0x0100 each) into dword 4 of r18, the same GRF
+ // that received the pointers above; per the OPT note, sharing one GRF is what lets the
+ // previous write carry NoDDClr and this one carry NoDDChk.
+ mov (1) r18.4<1>:ud 0x1000100:ud { NoDDChk }
+
+
--- /dev/null
+// Module name: AVS
+// Kernel RGBX_TO_NV12: the kernel body is the concatenation of the pre-processed
+// stages included below, in this order.
+// NOTE(review): the per-stage remarks are inferred from the file names - confirm
+// against each .g8a before relying on them.
+.kernel RGBX_TO_NV12
+.code
+
+// Common setup and layer-0 selection (presumably).
+#include "VP_Setup.g8a"
+#include "Set_Layer_0.g8a"
+// Channel pointer setup for the BGRA/RGBX buffer layout.
+#include "Set_AVS_Buf_0123_BGRA.g8a"
+// One stage per working buffer 0..3 (presumably the sampler fetches).
+#include "PA_AVS_Buf_0.g8a"
+#include "PA_AVS_Buf_1.g8a"
+#include "PA_AVS_Buf_2.g8a"
+#include "PA_AVS_Buf_3.g8a"
+// Colour-space conversion of the fetched R/G/B channels to Y/U/V.
+#include "RGB_to_YUV.g8a"
+// Output stage and end-of-thread (presumably NV12 write-out, then EOT).
+#include "Save_AVS_NV12.g8a"
+#include "EOT.g8a"
+
+.end_code
+
+.end_kernel
--- /dev/null
+ { 0x00600001, 0x23600208, 0x008d0000, 0x00000000 },
+ { 0x00600001, 0x23200208, 0x008d0000, 0x00000000 },
+ { 0x00600001, 0x23400208, 0x008d0000, 0x00000000 },
+ { 0x00600041, 0x20603ae8, 0x3a8d0060, 0x000000f0 },
+ { 0x00200001, 0x21141ae8, 0x004500e0, 0x00000000 },
+ { 0x01000010, 0x20002220, 0x1600005a, 0x00010001 },
+ { 0x00000008, 0x22201248, 0x16000044, 0x00000000 },
+ { 0x00000005, 0x22201248, 0x16000220, 0x00030003 },
+ { 0x01000010, 0x20001261, 0x16000220, 0x00010001 },
+ { 0x00010020, 0x34000005, 0x0e001400, 0x00000090 },
+ { 0x01000010, 0x20001261, 0x16000220, 0x00020002 },
+ { 0x00010020, 0x34000005, 0x0e001400, 0x000000f0 },
+ { 0x01000010, 0x20001261, 0x16000220, 0x00030003 },
+ { 0x00010020, 0x34000005, 0x0e001400, 0x00000180 },
+ { 0x00110001, 0x24003ae0, 0x000000c0, 0x00000000 },
+ { 0x00110048, 0x20c03ae8, 0x3a000060, 0x00000114 },
+ { 0x00000001, 0x24003ae0, 0x000000a0, 0x00000000 },
+ { 0x00000048, 0x20a03ae8, 0x3a000080, 0x00000118 },
+ { 0x00000020, 0x34000004, 0x0e001400, 0x000001a0 },
+ { 0x00110001, 0x24003ae0, 0x000000c0, 0x00000000 },
+ { 0x00110048, 0x20c03ae8, 0x3a000060, 0x00000118 },
+ { 0x00000001, 0x220012e8, 0x00000040, 0x00000000 },
+ { 0x00000040, 0x22203ae8, 0x3a004114, 0x00000200 },
+ { 0x00000040, 0x22203ae8, 0x3e000220, 0xc1800000 },
+ { 0x00000001, 0x24003ae0, 0x000000a0, 0x00000000 },
+ { 0x00000048, 0x20a03ae8, 0x3a000080, 0x00000220 },
+ { 0x00000020, 0x34000004, 0x0e001400, 0x00000120 },
+ { 0x00110001, 0x220012e8, 0x00000040, 0x00000000 },
+ { 0x00110040, 0x22203ae8, 0x3a004114, 0x00000200 },
+ { 0x00110040, 0x22203ae8, 0x3e000220, 0xc1800000 },
+ { 0x00110001, 0x24003ae0, 0x000000c0, 0x00000000 },
+ { 0x00110048, 0x20c03ae8, 0x3a000060, 0x00000220 },
+ { 0x00000001, 0x220012e8, 0x00000042, 0x00000000 },
+ { 0x00000040, 0x22203ae8, 0x3a004118, 0x00000200 },
+ { 0x00000040, 0x22203ae8, 0x3e000220, 0xc1800000 },
+ { 0x00000001, 0x24003ae0, 0x000000a0, 0x00000000 },
+ { 0x00000048, 0x20a03ae8, 0x3a000080, 0x00000220 },
+ { 0x00000020, 0x34000004, 0x0e001400, 0x00000070 },
+ { 0x00110001, 0x220012e8, 0x00000042, 0x00000000 },
+ { 0x00110040, 0x22203ae8, 0x3a004118, 0x00000200 },
+ { 0x00110040, 0x22203ae8, 0x3e000220, 0xc1800000 },
+ { 0x00110001, 0x24003ae0, 0x000000c0, 0x00000000 },
+ { 0x00110048, 0x20c03ae8, 0x3a000060, 0x00000220 },
+ { 0x00000001, 0x24003ae0, 0x000000a0, 0x00000000 },
+ { 0x00000048, 0x20a03ae8, 0x3a000080, 0x00000114 },
+ { 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+ { 0x00800001, 0x22a01648, 0x10000000, 0xffffffff },
+ { 0x00000005, 0x23021288, 0x16000044, 0x00030003 },
+ { 0x00000001, 0x23203ae8, 0x000000f8, 0x00000000 },
+ { 0x00000001, 0x23383ae8, 0x000000f4, 0x00000000 },
+ { 0x00000001, 0x23303ae8, 0x00000060, 0x00000000 },
+ { 0x00000001, 0x23343ae8, 0x00000080, 0x00000000 },
+ { 0x00000001, 0x23283ae8, 0x000000c0, 0x00000000 },
+ { 0x00000001, 0x232c3ae8, 0x000000a0, 0x00000000 },
+ { 0x00000001, 0x233c0608, 0x00000000, 0x00000000 },
+ { 0x00000040, 0x233c0208, 0x0600033c, 0x08000000 },
+ { 0x00000001, 0x24083ae0, 0x000000c0, 0x00000000 },
+ { 0x00000048, 0x24083ae0, 0x3e000060, 0x41000000 },
+ { 0x00000248, 0x22e83ae8, 0x3e0000f4, 0x41e00000 },
+ { 0x00000641, 0x22e43ae8, 0x3e000080, 0x40800000 },
+ { 0x00000001, 0x24103ae0, 0x00000060, 0x00000000 },
+ { 0x00000648, 0x22f03ae8, 0x3e0000f4, 0x41000000 },
+ { 0x00000401, 0x22f40608, 0x00000000, 0x00000000 },
+ { 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+ { 0x00400001, 0x24003660, 0x30000000, 0x00006ea2 },
+ { 0x00400040, 0x24001860, 0x16690400, 0x00460046 },
+ { 0x00400009, 0x22c01868, 0x16690400, 0x00050005 },
+ { 0x00400001, 0x24003660, 0x30000000, 0x00006204 },
+ { 0x00400040, 0x24001860, 0x16690400, 0x00400040 },
+ { 0x00400209, 0x22401868, 0x16690400, 0x00050005 },
+ { 0x00000401, 0x22500608, 0x00000000, 0x01000100 },
+ { 0x00000001, 0x22d00608, 0x00000000, 0x00400040 },
+ { 0x00000001, 0x220c0208, 0x0000000c, 0x00000000 },
+ { 0x00000040, 0x22000200, 0x060002f4, 0x050eb000 },
+ { 0x00000001, 0x22080608, 0x00000000, 0x00000000 },
+ { 0x00000001, 0x23240608, 0x00000000, 0x00000000 },
+ { 0x00600001, 0x22200208, 0x008d0320, 0x00000000 },
+ { 0x02000031, 0x28002248, 0x00000200, 0x00000200 },
+ { 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+ { 0x00000001, 0x22d00608, 0x00000000, 0x00400040 },
+ { 0x00000001, 0x220c0208, 0x0000000c, 0x00000000 },
+ { 0x00000040, 0x22000200, 0x060002f4, 0x050eb000 },
+ { 0x00000001, 0x22080608, 0x00000000, 0x00000000 },
+ { 0x00000001, 0x23240608, 0x00000000, 0x00000001 },
+ { 0x00600001, 0x22200208, 0x008d0320, 0x00000000 },
+ { 0x02000031, 0x2a002248, 0x00000200, 0x00000200 },
+ { 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+ { 0x00000001, 0x22d00608, 0x00000000, 0x00400040 },
+ { 0x00000001, 0x220c0208, 0x0000000c, 0x00000000 },
+ { 0x00000040, 0x22000200, 0x060002f4, 0x050eb000 },
+ { 0x00000001, 0x22080608, 0x00000000, 0x00000000 },
+ { 0x00000001, 0x23240608, 0x00000000, 0x00000002 },
+ { 0x00600001, 0x22200208, 0x008d0320, 0x00000000 },
+ { 0x02000031, 0x2c002248, 0x00000200, 0x00000200 },
+ { 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+ { 0x00000001, 0x22d00608, 0x00000000, 0x00400040 },
+ { 0x00000001, 0x220c0208, 0x0000000c, 0x00000000 },
+ { 0x00000040, 0x22000200, 0x060002f4, 0x050eb000 },
+ { 0x00000001, 0x22080608, 0x00000000, 0x00000000 },
+ { 0x00000001, 0x23240608, 0x00000000, 0x00000003 },
+ { 0x00600001, 0x22200208, 0x008d0320, 0x00000000 },
+ { 0x02000031, 0x2e002248, 0x00000200, 0x00000200 },
+ { 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+ { 0x00400001, 0x22001240, 0x006902c0, 0x00000000 },
+ { 0x00400001, 0x22081240, 0x006902c0, 0x00000000 },
+ { 0x02800005, 0x20001260, 0x1e000040, 0x00010001 },
+ { 0x00010001, 0x22201048, 0x00000200, 0x00000000 },
+ { 0x00010001, 0x22001040, 0x00000202, 0x00000000 },
+ { 0x00010001, 0x22021240, 0x00000220, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8201, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8211, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8401, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8411, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8001, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8011, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca012288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc012288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8012288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8221, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8231, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8421, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8431, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8021, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8031, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca212288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc212288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8212288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8241, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8251, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8441, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8451, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8041, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8051, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca412288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc412288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8412288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8261, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8271, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8461, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8471, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8061, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8071, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca612288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc612288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8612288, 0x00cf05c0, 0x00000000 },
+ { 0x00600040, 0x22001040, 0x168d0200, 0x02000200 },
+ { 0x00600001, 0x238022e8, 0x00ae8201, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8211, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8401, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8411, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8001, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8011, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca012288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc012288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8012288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8221, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8231, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8421, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8431, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8021, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8031, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca212288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc212288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8212288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8241, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8251, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8441, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8451, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8041, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8051, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca412288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc412288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8412288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8261, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8271, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8461, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8471, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8061, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8071, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca612288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc612288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8612288, 0x00cf05c0, 0x00000000 },
+ { 0x00600040, 0x22001040, 0x168d0200, 0x02000200 },
+ { 0x00600001, 0x238022e8, 0x00ae8201, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8211, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8401, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8411, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8001, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8011, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca012288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc012288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8012288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8221, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8231, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8421, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8431, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8021, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8031, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca212288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc212288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8212288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8241, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8251, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8441, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8451, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8041, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8051, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca412288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc412288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8412288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8261, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8271, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8461, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8471, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8061, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8071, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca612288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc612288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8612288, 0x00cf05c0, 0x00000000 },
+ { 0x00600040, 0x22001040, 0x168d0200, 0x02000200 },
+ { 0x00600001, 0x238022e8, 0x00ae8201, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8211, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8401, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8411, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8001, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8011, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8001648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca012288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc012288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8012288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8221, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8231, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8421, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8431, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8021, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8031, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8201648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca212288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc212288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8212288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8241, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8251, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8441, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8451, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8041, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8051, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8401648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca412288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc412288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8412288, 0x00cf05c0, 0x00000000 },
+ { 0x00600001, 0x238022e8, 0x00ae8261, 0x00000000 },
+ { 0x00600001, 0x23a022e8, 0x00ae8271, 0x00000000 },
+ { 0x00600001, 0x23c022e8, 0x00ae8461, 0x00000000 },
+ { 0x00600001, 0x23e022e8, 0x00ae8471, 0x00000000 },
+ { 0x00600001, 0x240022e8, 0x00ae8061, 0x00000000 },
+ { 0x00600001, 0x242022e8, 0x00ae8071, 0x00000000 },
+ { 0x00800041, 0x24003ae0, 0x3e8d0380, 0x3e991687 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0x3f1645a2 },
+ { 0x00800048, 0x24803ae8, 0x3e8d0400, 0x3de978d5 },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0xbe2d0e56 },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbea978d5 },
+ { 0x00800048, 0x24c03ae8, 0x3e8d0400, 0x3eff7cee },
+ { 0x00800001, 0x24003ee0, 0x38000000, 0x43000000 },
+ { 0x00800048, 0x24003ae0, 0x3e8d0380, 0x3eff7cee },
+ { 0x00800048, 0x24003ae0, 0x3e8d03c0, 0xbed60419 },
+ { 0x00800048, 0x25003ae8, 0x3e8d0400, 0xbda6809d },
+ { 0x00800001, 0x45403a68, 0x008d0480, 0x00000000 },
+ { 0x00800001, 0x45803a68, 0x008d04c0, 0x00000000 },
+ { 0x00800001, 0x45c03a68, 0x008d0500, 0x00000000 },
+ { 0x00800001, 0xaa601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xac601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xa8601648, 0x10000000, 0x00000000 },
+ { 0x00800001, 0xca612288, 0x00cf0540, 0x00000000 },
+ { 0x00800001, 0xcc612288, 0x00cf0580, 0x00000000 },
+ { 0x00800001, 0xc8612288, 0x00cf05c0, 0x00000000 },
+ { 0x00400040, 0x22001a40, 0x166902c0, 0x00000000 },
+ { 0x00400040, 0x22081a40, 0x166902c0, 0x02000200 },
+ { 0x00600001, 0x23800208, 0x008d0360, 0x00000000 },
+ { 0x00600001, 0x24a00208, 0x008d0360, 0x00000000 },
+ { 0x00200201, 0x23801a28, 0x004500e0, 0x00000000 },
+ { 0x00000201, 0x24a01a28, 0x000000e0, 0x00000000 },
+ { 0x00000608, 0x24a41a28, 0x1e0000e2, 0x00010001 },
+ { 0x00000401, 0x23880608, 0x00000000, 0x000f000f },
+ { 0x00000401, 0x24a80608, 0x00000000, 0x0007000f },
+ { 0x80800040, 0xa2001248, 0x16b18200, 0x00800080 },
+ { 0x80800040, 0xa2201248, 0x16b18220, 0x00800080 },
+ { 0x80800040, 0xa2401248, 0x16b18240, 0x00800080 },
+ { 0x80800040, 0xa2601248, 0x16b18260, 0x00800080 },
+ { 0x00600008, 0x45c01248, 0x1eae8400, 0x00010001 },
+ { 0x00600008, 0x45e01248, 0x1eae8420, 0x00010001 },
+ { 0x00600008, 0x46001248, 0x1eae8440, 0x00010001 },
+ { 0x00600008, 0x46201248, 0x1eae8460, 0x00010001 },
+ { 0x00600040, 0x45c01248, 0x12ae05c0, 0x00ae05e0 },
+ { 0x80600040, 0xc4001248, 0x16ae05c0, 0x00800080 },
+ { 0x00600040, 0x46001248, 0x12ae0600, 0x00ae0620 },
+ { 0x80600040, 0xc4401248, 0x16ae0600, 0x00800080 },
+ { 0x00600008, 0x46401248, 0x1eae8000, 0x00010001 },
+ { 0x00600008, 0x46601248, 0x1eae8020, 0x00010001 },
+ { 0x00600008, 0x46801248, 0x1eae8040, 0x00010001 },
+ { 0x00600008, 0x46a01248, 0x1eae8060, 0x00010001 },
+ { 0x00600040, 0x46401248, 0x12ae0640, 0x00ae0660 },
+ { 0x80600040, 0xc0001248, 0x16ae0640, 0x00800080 },
+ { 0x00600040, 0x46801248, 0x12ae0680, 0x00ae06a0 },
+ { 0x80600040, 0xc0401248, 0x16ae0680, 0x00800080 },
+ { 0x00400040, 0x22001a40, 0x166902c0, 0x04000400 },
+ { 0x80800040, 0xaa001248, 0x16b18a00, 0x00800080 },
+ { 0x80800040, 0xaa201248, 0x16b18a20, 0x00800080 },
+ { 0x80800040, 0xaa401248, 0x16b18a40, 0x00800080 },
+ { 0x80800040, 0xaa601248, 0x16b18a60, 0x00800080 },
+ { 0x00600008, 0x45c01248, 0x1eae8c00, 0x00010001 },
+ { 0x00600008, 0x45e01248, 0x1eae8c20, 0x00010001 },
+ { 0x00600008, 0x46001248, 0x1eae8c40, 0x00010001 },
+ { 0x00600008, 0x46201248, 0x1eae8c60, 0x00010001 },
+ { 0x00600040, 0x45c01248, 0x12ae05c0, 0x00ae05e0 },
+ { 0x80600040, 0xcc001248, 0x16ae05c0, 0x00800080 },
+ { 0x00600040, 0x46001248, 0x12ae0600, 0x00ae0620 },
+ { 0x80600040, 0xcc401248, 0x16ae0600, 0x00800080 },
+ { 0x00600008, 0x46401248, 0x1eae8800, 0x00010001 },
+ { 0x00600008, 0x46601248, 0x1eae8820, 0x00010001 },
+ { 0x00600008, 0x46801248, 0x1eae8840, 0x00010001 },
+ { 0x00600008, 0x46a01248, 0x1eae8860, 0x00010001 },
+ { 0x00600040, 0x46401248, 0x12ae0640, 0x00ae0660 },
+ { 0x80600040, 0xc8001248, 0x16ae0640, 0x00800080 },
+ { 0x00600040, 0x46801248, 0x12ae0680, 0x00ae06a0 },
+ { 0x80600040, 0xc8401248, 0x16ae0680, 0x00800080 },
+ { 0x00400040, 0x22081a40, 0x166902c0, 0x06000600 },
+ { 0x80800040, 0xa2001248, 0x16b18200, 0x00800080 },
+ { 0x80800040, 0xa2201248, 0x16b18220, 0x00800080 },
+ { 0x80800040, 0xa2401248, 0x16b18240, 0x00800080 },
+ { 0x80800040, 0xa2601248, 0x16b18260, 0x00800080 },
+ { 0x00600008, 0x45c01248, 0x1eae8400, 0x00010001 },
+ { 0x00600008, 0x45e01248, 0x1eae8420, 0x00010001 },
+ { 0x00600008, 0x46001248, 0x1eae8440, 0x00010001 },
+ { 0x00600008, 0x46201248, 0x1eae8460, 0x00010001 },
+ { 0x00600040, 0x45c01248, 0x12ae05c0, 0x00ae05e0 },
+ { 0x80600040, 0xc4001248, 0x16ae05c0, 0x00800080 },
+ { 0x00600040, 0x46001248, 0x12ae0600, 0x00ae0620 },
+ { 0x80600040, 0xc4401248, 0x16ae0600, 0x00800080 },
+ { 0x00600008, 0x46401248, 0x1eae8000, 0x00010001 },
+ { 0x00600008, 0x46601248, 0x1eae8020, 0x00010001 },
+ { 0x00600008, 0x46801248, 0x1eae8040, 0x00010001 },
+ { 0x00600008, 0x46a01248, 0x1eae8060, 0x00010001 },
+ { 0x00600040, 0x46401248, 0x12ae0640, 0x00ae0660 },
+ { 0x80600040, 0xc0001248, 0x16ae0640, 0x00800080 },
+ { 0x00600040, 0x46801248, 0x12ae0680, 0x00ae06a0 },
+ { 0x80600040, 0xc0401248, 0x16ae0680, 0x00800080 },
+ { 0x00400040, 0x22001a40, 0x166902c0, 0x04000400 },
+ { 0x80800040, 0xaa001248, 0x16b18a00, 0x00800080 },
+ { 0x80800040, 0xaa201248, 0x16b18a20, 0x00800080 },
+ { 0x80800040, 0xaa401248, 0x16b18a40, 0x00800080 },
+ { 0x80800040, 0xaa601248, 0x16b18a60, 0x00800080 },
+ { 0x00600008, 0x45c01248, 0x1eae8c00, 0x00010001 },
+ { 0x00600008, 0x45e01248, 0x1eae8c20, 0x00010001 },
+ { 0x00600008, 0x46001248, 0x1eae8c40, 0x00010001 },
+ { 0x00600008, 0x46201248, 0x1eae8c60, 0x00010001 },
+ { 0x00600040, 0x45c01248, 0x12ae05c0, 0x00ae05e0 },
+ { 0x80600040, 0xcc001248, 0x16ae05c0, 0x00800080 },
+ { 0x00600040, 0x46001248, 0x12ae0600, 0x00ae0620 },
+ { 0x80600040, 0xcc401248, 0x16ae0600, 0x00800080 },
+ { 0x00600008, 0x46401248, 0x1eae8800, 0x00010001 },
+ { 0x00600008, 0x46601248, 0x1eae8820, 0x00010001 },
+ { 0x00600008, 0x46801248, 0x1eae8840, 0x00010001 },
+ { 0x00600008, 0x46a01248, 0x1eae8860, 0x00010001 },
+ { 0x00600040, 0x46401248, 0x12ae0640, 0x00ae0660 },
+ { 0x80600040, 0xc8001248, 0x16ae0640, 0x00800080 },
+ { 0x00600040, 0x46801248, 0x12ae0680, 0x00ae06a0 },
+ { 0x80600040, 0xc8401248, 0x16ae0680, 0x00800080 },
+ { 0x00400040, 0x22081a40, 0x166902c0, 0x06000600 },
+ { 0x00400040, 0x22001a40, 0x166902c0, 0x00000000 },
+ { 0x00400040, 0x22081a40, 0x166902c0, 0x02000200 },
+ { 0x00800201, 0x23a02288, 0x00d28201, 0x00000000 },
+ { 0x00800401, 0x23b02288, 0x00d28221, 0x00000000 },
+ { 0x00800201, 0x23c02288, 0x00d28241, 0x00000000 },
+ { 0x00800401, 0x23d02288, 0x00d28261, 0x00000000 },
+ { 0x00600201, 0x44c02288, 0x00cf8401, 0x00000000 },
+ { 0x00600601, 0x44d02288, 0x00cf8441, 0x00000000 },
+ { 0x00600601, 0x44c12288, 0x00cf8001, 0x00000000 },
+ { 0x00600401, 0x44d12288, 0x00cf8041, 0x00000000 },
+ { 0x00400040, 0x22001a40, 0x166902c0, 0x04000400 },
+ { 0x00800201, 0x23e02288, 0x00d28a01, 0x00000000 },
+ { 0x00800401, 0x23f02288, 0x00d28a21, 0x00000000 },
+ { 0x00800201, 0x24002288, 0x00d28a41, 0x00000000 },
+ { 0x00800401, 0x24102288, 0x00d28a61, 0x00000000 },
+ { 0x00600201, 0x44e02288, 0x00cf8c01, 0x00000000 },
+ { 0x00600601, 0x44f02288, 0x00cf8c41, 0x00000000 },
+ { 0x00600601, 0x44e12288, 0x00cf8801, 0x00000000 },
+ { 0x00600401, 0x44f12288, 0x00cf8841, 0x00000000 },
+ { 0x00400040, 0x22081a40, 0x166902c0, 0x06000600 },
+ { 0x00800201, 0x24202288, 0x00d28201, 0x00000000 },
+ { 0x00800401, 0x24302288, 0x00d28221, 0x00000000 },
+ { 0x00800201, 0x24402288, 0x00d28241, 0x00000000 },
+ { 0x00800401, 0x24502288, 0x00d28261, 0x00000000 },
+ { 0x00600201, 0x45002288, 0x00cf8401, 0x00000000 },
+ { 0x00600601, 0x45102288, 0x00cf8441, 0x00000000 },
+ { 0x00600601, 0x45012288, 0x00cf8001, 0x00000000 },
+ { 0x00600401, 0x45112288, 0x00cf8041, 0x00000000 },
+ { 0x00800201, 0x24602288, 0x00d28a01, 0x00000000 },
+ { 0x00800401, 0x24702288, 0x00d28a21, 0x00000000 },
+ { 0x00800201, 0x24802288, 0x00d28a41, 0x00000000 },
+ { 0x00800401, 0x24902288, 0x00d28a61, 0x00000000 },
+ { 0x00600201, 0x45202288, 0x00cf8c01, 0x00000000 },
+ { 0x00600601, 0x45302288, 0x00cf8c41, 0x00000000 },
+ { 0x00600601, 0x45212288, 0x00cf8801, 0x00000000 },
+ { 0x00600401, 0x45312288, 0x00cf8841, 0x00000000 },
+ { 0x0c000031, 0x20002220, 0x06000380, 0x120a8018 },
+ { 0x0c000031, 0x20002220, 0x060004a0, 0x0a0a8019 },
+ { 0x00600001, 0x2fe00208, 0x008d0000, 0x00000000 },
+ { 0x07000031, 0x20002220, 0x0e000fe0, 0x82000010 },