xref: /aosp_15_r20/external/igt-gpu-tools/lib/i915/shaders/ps/blit.g7a (revision d83cc019efdc2edc6c4b16e9034a3ceb8d35d77c)
1*d83cc019SAndroid Build Coastguard Worker/* Assemble with  ".../intel-gen4asm/src/intel-gen4asm -g 7" */
2*d83cc019SAndroid Build Coastguard Worker
3*d83cc019SAndroid Build Coastguard Worker
4*d83cc019SAndroid Build Coastguard Worker/* Move pixels into g10-g13. The pixel shaader does not load what you want. It
5*d83cc019SAndroid Build Coastguard Worker * loads the input data for a plane function to calculate what you want. The
6*d83cc019SAndroid Build Coastguard Worker * following is boiler plate code to move our normalized texture coordinates
7*d83cc019SAndroid Build Coastguard Worker * (u,v) into g10-g13. It does this 4 subspans (16 pixels) at a time.
8*d83cc019SAndroid Build Coastguard Worker *
9*d83cc019SAndroid Build Coastguard Worker * This should do the same thing, but it doesn't work for some reason.
10*d83cc019SAndroid Build Coastguard Worker *   pln(16) g10 g6<0,1,0>F g2<8,8,1>F	{ align1 };
11*d83cc019SAndroid Build Coastguard Worker *   pln(16) g12 g6.16<1>F g2<8,8,1>F	{ align1 };
12*d83cc019SAndroid Build Coastguard Worker */
13*d83cc019SAndroid Build Coastguard Worker/* U */
14*d83cc019SAndroid Build Coastguard Workerpln (8) g10<1>F g6.0<0,1,0>F g2.0<8,8,1>F { align1 }; /* pixel 0-7 */
15*d83cc019SAndroid Build Coastguard Workerpln (8) g11<1>F g6.0<0,1,0>F g4.0<8,8,1>F { align1 }; /* pixel 8-15 */
16*d83cc019SAndroid Build Coastguard Worker/* V */
17*d83cc019SAndroid Build Coastguard Workerpln (8) g12<1>F g6.16<0,1,0> g2.0<8,8,1>F { align1 }; /* pixel 0-7 */
18*d83cc019SAndroid Build Coastguard Workerpln (8) g13<1>F g6.16<0,1,0> g4.0<8,8,1>F { align1 }; /* pixel 8-15 */
19*d83cc019SAndroid Build Coastguard Worker
20*d83cc019SAndroid Build Coastguard Worker
21*d83cc019SAndroid Build Coastguard Worker/* Next the we want the sampler to fetch the src texture (ie. src buffer). This
22*d83cc019SAndroid Build Coastguard Worker * is done with a pretty simple send message. The output goes to g112, which is
23*d83cc019SAndroid Build Coastguard Worker * exactly what we're supposed to use in our final send message.
24*d83cc019SAndroid Build Coastguard Worker * In intel-gen4asm, we should end up parsed by the following rule:
25*d83cc019SAndroid Build Coastguard Worker *   predicate SEND execsize dst sendleadreg sndopr directsrcoperand instoptions
26*d83cc019SAndroid Build Coastguard Worker *
27*d83cc019SAndroid Build Coastguard Worker * Send message descriptor:
28*d83cc019SAndroid Build Coastguard Worker * 28:25 = message len = 4 // our 4 registers have 16 pixels
29*d83cc019SAndroid Build Coastguard Worker * 24:20 = response len = 8 // Each pixel is RGBA32, so we need 8 registers
30*d83cc019SAndroid Build Coastguard Worker * 19:19 = header present = 0
31*d83cc019SAndroid Build Coastguard Worker * 18:17 = SIMD16 = 2
32*d83cc019SAndroid Build Coastguard Worker * 16:12 = TYPE = 0  (regular sample)
33*d83cc019SAndroid Build Coastguard Worker * 11:08 = Sampler index = ignored/0
34*d83cc019SAndroid Build Coastguard Worker * 7:0 = binding table index = src = 1
35*d83cc019SAndroid Build Coastguard Worker * 0x8840001
36*d83cc019SAndroid Build Coastguard Worker *
37*d83cc019SAndroid Build Coastguard Worker * Send message extra descriptor
38*d83cc019SAndroid Build Coastguard Worker * 5:5 = End of Thread = 0
39*d83cc019SAndroid Build Coastguard Worker * 3:0 = Target Function ID = SFID_SAMPLER (2)
40*d83cc019SAndroid Build Coastguard Worker * 0x2
41*d83cc019SAndroid Build Coastguard Worker */
42*d83cc019SAndroid Build Coastguard Worker
43*d83cc019SAndroid Build Coastguard Workersend(16) g112 g10 0x2 0x8840001 { align1 };
44*d83cc019SAndroid Build Coastguard Worker
45*d83cc019SAndroid Build Coastguard Worker/* g112-g119 now contains the sample source input, and all we must do is write
46*d83cc019SAndroid Build Coastguard Worker * it out to the destination render target. This is done with the send message
47*d83cc019SAndroid Build Coastguard Worker * as well. The only extra bits are to terminate the pixel shader.
48*d83cc019SAndroid Build Coastguard Worker *
49*d83cc019SAndroid Build Coastguard Worker * Send message descriptor:
50*d83cc019SAndroid Build Coastguard Worker * 28:25 = message len = 8 // 16 pixels RGBA32
51*d83cc019SAndroid Build Coastguard Worker * 24:20 = response len = 0
52*d83cc019SAndroid Build Coastguard Worker * 19:19 = header present = 0
53*d83cc019SAndroid Build Coastguard Worker * 17:14 = message type = Render Target Write (12)
54*d83cc019SAndroid Build Coastguard Worker * 12:12 = Last Render Target Select = 1
55*d83cc019SAndroid Build Coastguard Worker * 10:08 = Message Type = SIMD16 (0)
56*d83cc019SAndroid Build Coastguard Worker * 07:00 = Binding Table Index = dest = 0
57*d83cc019SAndroid Build Coastguard Worker * 0x10031000
58*d83cc019SAndroid Build Coastguard Worker *
59*d83cc019SAndroid Build Coastguard Worker * Send message extra descriptor
60*d83cc019SAndroid Build Coastguard Worker * 5:5 = End of Thread = 1
61*d83cc019SAndroid Build Coastguard Worker * 3:0 = Target Function ID = SFID_DP_RC (5)
62*d83cc019SAndroid Build Coastguard Worker * 0x25
63*d83cc019SAndroid Build Coastguard Worker */
64*d83cc019SAndroid Build Coastguard Workersend(16) null g112  0x25 0x10031000 { align1, EOT };
65*d83cc019SAndroid Build Coastguard Worker
66*d83cc019SAndroid Build Coastguard Worker/* vim: set ft=c ts=4 sw=2 tw=80 et: */
67