1. store_src_rg coords = src.rg | |
2. init_lane_masks CondMask = LoopMask = RetMask = true | |
3. copy_constant _0_ok = 0xFFFFFFFF | |
4. copy_constant _1_splat_4(0) = 0x40800000 (4.0) | |
5. copy_constant _1_splat_4(1) = 0x40800000 (4.0) | |
6. copy_constant _1_splat_4(2) = 0x40800000 (4.0) | |
7. copy_constant _1_splat_4(3) = 0x40800000 (4.0) | |
8. copy_constant _1_splat_4(4) = 0x40800000 (4.0) | |
9. copy_constant _1_splat_4(5) = 0x40800000 (4.0) | |
10. copy_constant _1_splat_4(6) = 0x40800000 (4.0) | |
11. copy_constant _1_splat_4(7) = 0x40800000 (4.0) | |
12. copy_constant _1_splat_4(8) = 0x40800000 (4.0) | |
13. copy_constant _2_splat_2(0) = 0x40000000 (2.0) | |
14. copy_constant _2_splat_2(1) = 0x40000000 (2.0) | |
15. copy_constant _2_splat_2(2) = 0x40000000 (2.0) | |
16. copy_constant _2_splat_2(3) = 0x40000000 (2.0) | |
17. copy_constant _2_splat_2(4) = 0x40000000 (2.0) | |
18. copy_constant _2_splat_2(5) = 0x40000000 (2.0) | |
19. copy_constant _2_splat_2(6) = 0x40000000 (2.0) | |
20. copy_constant _2_splat_2(7) = 0x40000000 (2.0) | |
21. copy_constant _2_splat_2(8) = 0x40000000 (2.0) | |
22. zero_4_slots_unmasked _3_m(0..3) = 0 | |
23. zero_4_slots_unmasked _3_m(4..7) = 0 | |
24. zero_slot_unmasked _3_m(8) = 0 | |
25. zero_slot_unmasked $0 = 0 | |
26. copy_constant $1 = 0x40000000 (2.0) | |
27. shuffle $0..8 = ($0..8)[1 0 0 0 1 0 0 0 1] | |
28. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
29. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
30. copy_slot_unmasked _3_m(8) = $8 | |
31. copy_4_slots_unmasked $0..3 = _3_m(0..3) | |
32. copy_4_slots_unmasked $4..7 = _3_m(4..7) | |
33. copy_slot_unmasked $8 = _3_m(8) | |
34. copy_4_slots_unmasked $9..12 = _1_splat_4(0..3) | |
35. copy_4_slots_unmasked $13..16 = _1_splat_4(4..7) | |
36. copy_slot_unmasked $17 = _1_splat_4(8) | |
37. add_n_floats $0..8 += $9..17 | |
38. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
39. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
40. copy_slot_unmasked _3_m(8) = $8 | |
41. copy_slot_unmasked $0 = _0_ok | |
42. copy_4_slots_unmasked $1..4 = _3_m(0..3) | |
43. copy_4_slots_unmasked $5..8 = _3_m(4..7) | |
44. copy_slot_unmasked $9 = _3_m(8) | |
45. copy_constant $10 = 0x40C00000 (6.0) | |
46. copy_constant $11 = 0x40800000 (4.0) | |
47. copy_constant $12 = 0x40800000 (4.0) | |
48. copy_constant $13 = 0x40800000 (4.0) | |
49. copy_constant $14 = 0x40C00000 (6.0) | |
50. copy_constant $15 = 0x40800000 (4.0) | |
51. copy_constant $16 = 0x40800000 (4.0) | |
52. copy_constant $17 = 0x40800000 (4.0) | |
53. copy_constant $18 = 0x40C00000 (6.0) | |
54. cmpeq_n_floats $1..9 = equal($1..9, $10..18) | |
55. bitwise_and_4_ints $2..5 &= $6..9 | |
56. bitwise_and_2_ints $2..3 &= $4..5 | |
57. bitwise_and_int $2 &= $3 | |
58. bitwise_and_int $1 &= $2 | |
59. bitwise_and_int $0 &= $1 | |
60. copy_slot_unmasked _0_ok = $0 | |
61. zero_slot_unmasked $0 = 0 | |
62. copy_constant $1 = 0x40000000 (2.0) | |
63. shuffle $0..8 = ($0..8)[1 0 0 0 1 0 0 0 1] | |
64. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
65. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
66. copy_slot_unmasked _3_m(8) = $8 | |
67. copy_4_slots_unmasked $0..3 = _3_m(0..3) | |
68. copy_4_slots_unmasked $4..7 = _3_m(4..7) | |
69. copy_slot_unmasked $8 = _3_m(8) | |
70. copy_4_slots_unmasked $9..12 = _1_splat_4(0..3) | |
71. copy_4_slots_unmasked $13..16 = _1_splat_4(4..7) | |
72. copy_slot_unmasked $17 = _1_splat_4(8) | |
73. sub_n_floats $0..8 -= $9..17 | |
74. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
75. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
76. copy_slot_unmasked _3_m(8) = $8 | |
77. copy_slot_unmasked $0 = _0_ok | |
78. copy_4_slots_unmasked $1..4 = _3_m(0..3) | |
79. copy_4_slots_unmasked $5..8 = _3_m(4..7) | |
80. copy_slot_unmasked $9 = _3_m(8) | |
81. copy_constant $10 = 0xC0000000 (-2.0) | |
82. copy_constant $11 = 0xC0800000 (-4.0) | |
83. copy_constant $12 = 0xC0800000 (-4.0) | |
84. copy_constant $13 = 0xC0800000 (-4.0) | |
85. copy_constant $14 = 0xC0000000 (-2.0) | |
86. copy_constant $15 = 0xC0800000 (-4.0) | |
87. copy_constant $16 = 0xC0800000 (-4.0) | |
88. copy_constant $17 = 0xC0800000 (-4.0) | |
89. copy_constant $18 = 0xC0000000 (-2.0) | |
90. cmpeq_n_floats $1..9 = equal($1..9, $10..18) | |
91. bitwise_and_4_ints $2..5 &= $6..9 | |
92. bitwise_and_2_ints $2..3 &= $4..5 | |
93. bitwise_and_int $2 &= $3 | |
94. bitwise_and_int $1 &= $2 | |
95. bitwise_and_int $0 &= $1 | |
96. copy_slot_unmasked _0_ok = $0 | |
97. zero_slot_unmasked $0 = 0 | |
98. copy_constant $1 = 0x40000000 (2.0) | |
99. shuffle $0..8 = ($0..8)[1 0 0 0 1 0 0 0 1] | |
100. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
101. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
102. copy_slot_unmasked _3_m(8) = $8 | |
103. copy_4_slots_unmasked $0..3 = _3_m(0..3) | |
104. copy_4_slots_unmasked $4..7 = _3_m(4..7) | |
105. copy_slot_unmasked $8 = _3_m(8) | |
106. copy_4_slots_unmasked $9..12 = _1_splat_4(0..3) | |
107. copy_4_slots_unmasked $13..16 = _1_splat_4(4..7) | |
108. copy_slot_unmasked $17 = _1_splat_4(8) | |
109. div_n_floats $0..8 /= $9..17 | |
110. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
111. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
112. copy_slot_unmasked _3_m(8) = $8 | |
113. copy_slot_unmasked $0 = _0_ok | |
114. copy_4_slots_unmasked $1..4 = _3_m(0..3) | |
115. copy_4_slots_unmasked $5..8 = _3_m(4..7) | |
116. copy_slot_unmasked $9 = _3_m(8) | |
117. zero_slot_unmasked $10 = 0 | |
118. copy_constant $11 = 0x3F000000 (0.5) | |
119. shuffle $10..18 = ($10..18)[1 0 0 0 1 0 0 0 1] | |
120. cmpeq_n_floats $1..9 = equal($1..9, $10..18) | |
121. bitwise_and_4_ints $2..5 &= $6..9 | |
122. bitwise_and_2_ints $2..3 &= $4..5 | |
123. bitwise_and_int $2 &= $3 | |
124. bitwise_and_int $1 &= $2 | |
125. bitwise_and_int $0 &= $1 | |
126. copy_slot_unmasked _0_ok = $0 | |
127. copy_4_slots_unmasked $0..3 = _1_splat_4(0..3) | |
128. copy_4_slots_unmasked $4..7 = _1_splat_4(4..7) | |
129. copy_slot_unmasked $8 = _1_splat_4(8) | |
130. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
131. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
132. copy_slot_unmasked _3_m(8) = $8 | |
133. copy_4_slots_unmasked $0..3 = _3_m(0..3) | |
134. copy_4_slots_unmasked $4..7 = _3_m(4..7) | |
135. copy_slot_unmasked $8 = _3_m(8) | |
136. zero_slot_unmasked $9 = 0 | |
137. copy_constant $10 = 0x40000000 (2.0) | |
138. shuffle $9..17 = ($9..17)[1 0 0 0 1 0 0 0 1] | |
139. add_n_floats $0..8 += $9..17 | |
140. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
141. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
142. copy_slot_unmasked _3_m(8) = $8 | |
143. copy_slot_unmasked $0 = _0_ok | |
144. copy_4_slots_unmasked $1..4 = _3_m(0..3) | |
145. copy_4_slots_unmasked $5..8 = _3_m(4..7) | |
146. copy_slot_unmasked $9 = _3_m(8) | |
147. copy_constant $10 = 0x40C00000 (6.0) | |
148. copy_constant $11 = 0x40800000 (4.0) | |
149. copy_constant $12 = 0x40800000 (4.0) | |
150. copy_constant $13 = 0x40800000 (4.0) | |
151. copy_constant $14 = 0x40C00000 (6.0) | |
152. copy_constant $15 = 0x40800000 (4.0) | |
153. copy_constant $16 = 0x40800000 (4.0) | |
154. copy_constant $17 = 0x40800000 (4.0) | |
155. copy_constant $18 = 0x40C00000 (6.0) | |
156. cmpeq_n_floats $1..9 = equal($1..9, $10..18) | |
157. bitwise_and_4_ints $2..5 &= $6..9 | |
158. bitwise_and_2_ints $2..3 &= $4..5 | |
159. bitwise_and_int $2 &= $3 | |
160. bitwise_and_int $1 &= $2 | |
161. bitwise_and_int $0 &= $1 | |
162. copy_slot_unmasked _0_ok = $0 | |
163. copy_4_slots_unmasked $0..3 = _1_splat_4(0..3) | |
164. copy_4_slots_unmasked $4..7 = _1_splat_4(4..7) | |
165. copy_slot_unmasked $8 = _1_splat_4(8) | |
166. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
167. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
168. copy_slot_unmasked _3_m(8) = $8 | |
169. copy_4_slots_unmasked $0..3 = _3_m(0..3) | |
170. copy_4_slots_unmasked $4..7 = _3_m(4..7) | |
171. copy_slot_unmasked $8 = _3_m(8) | |
172. zero_slot_unmasked $9 = 0 | |
173. copy_constant $10 = 0x40000000 (2.0) | |
174. shuffle $9..17 = ($9..17)[1 0 0 0 1 0 0 0 1] | |
175. sub_n_floats $0..8 -= $9..17 | |
176. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
177. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
178. copy_slot_unmasked _3_m(8) = $8 | |
179. copy_slot_unmasked $0 = _0_ok | |
180. copy_4_slots_unmasked $1..4 = _3_m(0..3) | |
181. copy_4_slots_unmasked $5..8 = _3_m(4..7) | |
182. copy_slot_unmasked $9 = _3_m(8) | |
183. copy_constant $10 = 0x40000000 (2.0) | |
184. copy_constant $11 = 0x40800000 (4.0) | |
185. copy_constant $12 = 0x40800000 (4.0) | |
186. copy_constant $13 = 0x40800000 (4.0) | |
187. copy_constant $14 = 0x40000000 (2.0) | |
188. copy_constant $15 = 0x40800000 (4.0) | |
189. copy_constant $16 = 0x40800000 (4.0) | |
190. copy_constant $17 = 0x40800000 (4.0) | |
191. copy_constant $18 = 0x40000000 (2.0) | |
192. cmpeq_n_floats $1..9 = equal($1..9, $10..18) | |
193. bitwise_and_4_ints $2..5 &= $6..9 | |
194. bitwise_and_2_ints $2..3 &= $4..5 | |
195. bitwise_and_int $2 &= $3 | |
196. bitwise_and_int $1 &= $2 | |
197. bitwise_and_int $0 &= $1 | |
198. copy_slot_unmasked _0_ok = $0 | |
199. copy_4_slots_unmasked $0..3 = _1_splat_4(0..3) | |
200. copy_4_slots_unmasked $4..7 = _1_splat_4(4..7) | |
201. copy_slot_unmasked $8 = _1_splat_4(8) | |
202. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
203. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
204. copy_slot_unmasked _3_m(8) = $8 | |
205. copy_4_slots_unmasked $0..3 = _3_m(0..3) | |
206. copy_4_slots_unmasked $4..7 = _3_m(4..7) | |
207. copy_slot_unmasked $8 = _3_m(8) | |
208. copy_4_slots_unmasked $9..12 = _2_splat_2(0..3) | |
209. copy_4_slots_unmasked $13..16 = _2_splat_2(4..7) | |
210. copy_slot_unmasked $17 = _2_splat_2(8) | |
211. div_n_floats $0..8 /= $9..17 | |
212. copy_4_slots_unmasked _3_m(0..3) = $0..3 | |
213. copy_4_slots_unmasked _3_m(4..7) = $4..7 | |
214. copy_slot_unmasked _3_m(8) = $8 | |
215. copy_slot_unmasked $0 = _0_ok | |
216. copy_4_slots_unmasked $1..4 = _3_m(0..3) | |
217. copy_4_slots_unmasked $5..8 = _3_m(4..7) | |
218. copy_slot_unmasked $9 = _3_m(8) | |
219. copy_constant $10 = 0x40000000 (2.0) | |
220. copy_constant $11 = 0x40000000 (2.0) | |
221. copy_constant $12 = 0x40000000 (2.0) | |
222. copy_constant $13 = 0x40000000 (2.0) | |
223. copy_constant $14 = 0x40000000 (2.0) | |
224. copy_constant $15 = 0x40000000 (2.0) | |
225. copy_constant $16 = 0x40000000 (2.0) | |
226. copy_constant $17 = 0x40000000 (2.0) | |
227. copy_constant $18 = 0x40000000 (2.0) | |
228. cmpeq_n_floats $1..9 = equal($1..9, $10..18) | |
229. bitwise_and_4_ints $2..5 &= $6..9 | |
230. bitwise_and_2_ints $2..3 &= $4..5 | |
231. bitwise_and_int $2 &= $3 | |
232. bitwise_and_int $1 &= $2 | |
233. bitwise_and_int $0 &= $1 | |
234. copy_slot_unmasked _0_ok = $0 | |
235. copy_constant _4_m(0) = 0x3F800000 (1.0) | |
236. copy_constant _4_m(1) = 0x40000000 (2.0) | |
237. copy_constant _4_m(2) = 0x40400000 (3.0) | |
238. copy_constant _4_m(3) = 0x40800000 (4.0) | |
239. copy_constant _4_m(4) = 0x40A00000 (5.0) | |
240. copy_constant _4_m(5) = 0x40C00000 (6.0) | |
241. copy_constant _4_m(6) = 0x40E00000 (7.0) | |
242. copy_constant _4_m(7) = 0x41000000 (8.0) | |
243. copy_constant _4_m(8) = 0x41100000 (9.0) | |
244. copy_constant _4_m(9) = 0x41200000 (10.0) | |
245. copy_constant _4_m(10) = 0x41300000 (11.0) | |
246. copy_constant _4_m(11) = 0x41400000 (12.0) | |
247. copy_constant _4_m(12) = 0x41500000 (13.0) | |
248. copy_constant _4_m(13) = 0x41600000 (14.0) | |
249. copy_constant _4_m(14) = 0x41700000 (15.0) | |
250. copy_constant _4_m(15) = 0x41800000 (16.0) | |
251. copy_4_slots_unmasked $0..3 = _4_m(0..3) | |
252. copy_4_slots_unmasked $4..7 = _4_m(4..7) | |
253. copy_4_slots_unmasked $8..11 = _4_m(8..11) | |
254. copy_4_slots_unmasked $12..15 = _4_m(12..15) | |
255. copy_constant $16 = 0x41800000 (16.0) | |
256. copy_constant $17 = 0x41700000 (15.0) | |
257. copy_constant $18 = 0x41600000 (14.0) | |
258. copy_constant $19 = 0x41500000 (13.0) | |
259. copy_constant $20 = 0x41400000 (12.0) | |
260. copy_constant $21 = 0x41300000 (11.0) | |
261. copy_constant $22 = 0x41200000 (10.0) | |
262. copy_constant $23 = 0x41100000 (9.0) | |
263. copy_constant $24 = 0x41000000 (8.0) | |
264. copy_constant $25 = 0x40E00000 (7.0) | |
265. copy_constant $26 = 0x40C00000 (6.0) | |
266. copy_constant $27 = 0x40A00000 (5.0) | |
267. copy_constant $28 = 0x40800000 (4.0) | |
268. copy_constant $29 = 0x40400000 (3.0) | |
269. copy_constant $30 = 0x40000000 (2.0) | |
270. copy_constant $31 = 0x3F800000 (1.0) | |
271. add_n_floats $0..15 += $16..31 | |
272. copy_4_slots_unmasked _4_m(0..3) = $0..3 | |
273. copy_4_slots_unmasked _4_m(4..7) = $4..7 | |
274. copy_4_slots_unmasked _4_m(8..11) = $8..11 | |
275. copy_4_slots_unmasked _4_m(12..15) = $12..15 | |
276. copy_slot_unmasked $0 = _0_ok | |
277. copy_4_slots_unmasked $1..4 = _4_m(0..3) | |
278. copy_4_slots_unmasked $5..8 = _4_m(4..7) | |
279. copy_4_slots_unmasked $9..12 = _4_m(8..11) | |
280. copy_4_slots_unmasked $13..16 = _4_m(12..15) | |
281. copy_constant $17 = 0x41880000 (17.0) | |
282. copy_constant $18 = 0x41880000 (17.0) | |
283. copy_constant $19 = 0x41880000 (17.0) | |
284. copy_constant $20 = 0x41880000 (17.0) | |
285. copy_constant $21 = 0x41880000 (17.0) | |
286. copy_constant $22 = 0x41880000 (17.0) | |
287. copy_constant $23 = 0x41880000 (17.0) | |
288. copy_constant $24 = 0x41880000 (17.0) | |
289. copy_constant $25 = 0x41880000 (17.0) | |
290. copy_constant $26 = 0x41880000 (17.0) | |
291. copy_constant $27 = 0x41880000 (17.0) | |
292. copy_constant $28 = 0x41880000 (17.0) | |
293. copy_constant $29 = 0x41880000 (17.0) | |
294. copy_constant $30 = 0x41880000 (17.0) | |
295. copy_constant $31 = 0x41880000 (17.0) | |
296. copy_constant $32 = 0x41880000 (17.0) | |
297. cmpeq_n_floats $1..16 = equal($1..16, $17..32) | |
298. bitwise_and_4_ints $9..12 &= $13..16 | |
299. bitwise_and_4_ints $5..8 &= $9..12 | |
300. bitwise_and_4_ints $1..4 &= $5..8 | |
301. bitwise_and_2_ints $1..2 &= $3..4 | |
302. bitwise_and_int $1 &= $2 | |
303. bitwise_and_int $0 &= $1 | |
304. copy_slot_unmasked _0_ok = $0 | |
305. copy_constant _5_m(0) = 0x41200000 (10.0) | |
306. copy_constant _5_m(1) = 0x41A00000 (20.0) | |
307. copy_constant _5_m(2) = 0x41F00000 (30.0) | |
308. copy_constant _5_m(3) = 0x42200000 (40.0) | |
309. copy_4_slots_unmasked $0..3 = _5_m | |
310. copy_constant $4 = 0x3F800000 (1.0) | |
311. copy_constant $5 = 0x40000000 (2.0) | |
312. copy_constant $6 = 0x40400000 (3.0) | |
313. copy_constant $7 = 0x40800000 (4.0) | |
314. sub_4_floats $0..3 -= $4..7 | |
315. copy_4_slots_unmasked _5_m = $0..3 | |
316. copy_slot_unmasked $0 = _0_ok | |
317. copy_4_slots_unmasked $1..4 = _5_m | |
318. copy_constant $5 = 0x41100000 (9.0) | |
319. copy_constant $6 = 0x41900000 (18.0) | |
320. copy_constant $7 = 0x41D80000 (27.0) | |
321. copy_constant $8 = 0x42100000 (36.0) | |
322. cmpeq_4_floats $1..4 = equal($1..4, $5..8) | |
323. bitwise_and_2_ints $1..2 &= $3..4 | |
324. bitwise_and_int $1 &= $2 | |
325. bitwise_and_int $0 &= $1 | |
326. copy_slot_unmasked _0_ok = $0 | |
327. copy_constant _6_m(0) = 0x40000000 (2.0) | |
328. copy_constant _6_m(1) = 0x40800000 (4.0) | |
329. copy_constant _6_m(2) = 0x40C00000 (6.0) | |
330. copy_constant _6_m(3) = 0x41000000 (8.0) | |
331. copy_4_slots_unmasked $0..3 = _6_m | |
332. copy_constant $4 = 0x40000000 (2.0) | |
333. copy_constant $5 = 0x40000000 (2.0) | |
334. copy_constant $6 = 0x40000000 (2.0) | |
335. copy_constant $7 = 0x40800000 (4.0) | |
336. div_4_floats $0..3 /= $4..7 | |
337. copy_4_slots_unmasked _6_m = $0..3 | |
338. copy_slot_unmasked $0 = _0_ok | |
339. copy_4_slots_unmasked $1..4 = _6_m | |
340. copy_constant $5 = 0x3F800000 (1.0) | |
341. copy_constant $6 = 0x40000000 (2.0) | |
342. copy_constant $7 = 0x40400000 (3.0) | |
343. copy_constant $8 = 0x40000000 (2.0) | |
344. cmpeq_4_floats $1..4 = equal($1..4, $5..8) | |
345. bitwise_and_2_ints $1..2 &= $3..4 | |
346. bitwise_and_int $1 &= $2 | |
347. bitwise_and_int $0 &= $1 | |
348. copy_slot_unmasked _0_ok = $0 | |
349. copy_constant _7_m(0) = 0x3F800000 (1.0) | |
350. copy_constant _7_m(1) = 0x40000000 (2.0) | |
351. copy_constant _7_m(2) = 0x40E00000 (7.0) | |
352. copy_constant _7_m(3) = 0x40800000 (4.0) | |
353. copy_4_slots_unmasked $53..56 = _7_m | |
354. swizzle_3 $54..56 = ($54..56).yxz | |
355. copy_constant $57 = 0x40400000 (3.0) | |
356. copy_constant $58 = 0x40A00000 (5.0) | |
357. copy_constant $59 = 0x40400000 (3.0) | |
358. copy_constant $60 = 0x40000000 (2.0) | |
359. copy_2_slots_unmasked $0..1 = $53..54 | |
360. copy_2_slots_unmasked $2..3 = $57..58 | |
361. mul_2_floats $0..1 *= $2..3 | |
362. add_float $0 += $1 | |
363. copy_2_slots_unmasked $1..2 = $55..56 | |
364. copy_2_slots_unmasked $3..4 = $57..58 | |
365. mul_2_floats $1..2 *= $3..4 | |
366. add_float $1 += $2 | |
367. copy_2_slots_unmasked $2..3 = $53..54 | |
368. copy_2_slots_unmasked $4..5 = $59..60 | |
369. mul_2_floats $2..3 *= $4..5 | |
370. add_float $2 += $3 | |
371. copy_2_slots_unmasked $3..4 = $55..56 | |
372. copy_2_slots_unmasked $5..6 = $59..60 | |
373. mul_2_floats $3..4 *= $5..6 | |
374. add_float $3 += $4 | |
375. copy_4_slots_unmasked _7_m = $0..3 | |
376. copy_slot_unmasked $0 = _0_ok | |
377. copy_4_slots_unmasked $1..4 = _7_m | |
378. copy_constant $5 = 0x42180000 (38.0) | |
379. copy_constant $6 = 0x41D00000 (26.0) | |
380. copy_constant $7 = 0x41880000 (17.0) | |
381. copy_constant $8 = 0x41600000 (14.0) | |
382. cmpeq_4_floats $1..4 = equal($1..4, $5..8) | |
383. bitwise_and_2_ints $1..2 &= $3..4 | |
384. bitwise_and_int $1 &= $2 | |
385. bitwise_and_int $0 &= $1 | |
386. copy_slot_unmasked _0_ok = $0 | |
387. copy_constant _8_m(0) = 0x41200000 (10.0) | |
388. copy_constant _8_m(1) = 0x40800000 (4.0) | |
389. copy_constant _8_m(2) = 0x40000000 (2.0) | |
390. copy_constant _8_m(3) = 0x41A00000 (20.0) | |
391. copy_constant _8_m(4) = 0x40A00000 (5.0) | |
392. copy_constant _8_m(5) = 0x40400000 (3.0) | |
393. copy_constant _8_m(6) = 0x41200000 (10.0) | |
394. copy_constant _8_m(7) = 0x40C00000 (6.0) | |
395. copy_constant _8_m(8) = 0x40A00000 (5.0) | |
396. copy_4_slots_unmasked $53..56 = _8_m(0..3) | |
397. copy_4_slots_unmasked $57..60 = _8_m(4..7) | |
398. copy_slot_unmasked $61 = _8_m(8) | |
399. shuffle $54..61 = ($54..61)[2 5 0 3 6 1 4 7] | |
400. copy_constant $62 = 0x40400000 (3.0) | |
401. copy_constant $63 = 0x40400000 (3.0) | |
402. copy_constant $64 = 0x40800000 (4.0) | |
403. copy_constant $65 = 0x40000000 (2.0) | |
404. copy_constant $66 = 0x40400000 (3.0) | |
405. copy_constant $67 = 0x40800000 (4.0) | |
406. copy_constant $68 = 0x40800000 (4.0) | |
407. copy_constant $69 = 0x41100000 (9.0) | |
408. copy_constant $70 = 0x40000000 (2.0) | |
409. copy_3_slots_unmasked $0..2 = $53..55 | |
410. copy_3_slots_unmasked $3..5 = $62..64 | |
411. mul_3_floats $0..2 *= $3..5 | |
412. add_float $1 += $2 | |
413. add_float $0 += $1 | |
414. copy_3_slots_unmasked $1..3 = $56..58 | |
415. copy_3_slots_unmasked $4..6 = $62..64 | |
416. mul_3_floats $1..3 *= $4..6 | |
417. add_float $2 += $3 | |
418. add_float $1 += $2 | |
419. copy_3_slots_unmasked $2..4 = $59..61 | |
420. copy_3_slots_unmasked $5..7 = $62..64 | |
421. mul_3_floats $2..4 *= $5..7 | |
422. add_float $3 += $4 | |
423. add_float $2 += $3 | |
424. copy_3_slots_unmasked $3..5 = $53..55 | |
425. copy_3_slots_unmasked $6..8 = $65..67 | |
426. mul_3_floats $3..5 *= $6..8 | |
427. add_float $4 += $5 | |
428. add_float $3 += $4 | |
429. copy_3_slots_unmasked $4..6 = $56..58 | |
430. copy_3_slots_unmasked $7..9 = $65..67 | |
431. mul_3_floats $4..6 *= $7..9 | |
432. add_float $5 += $6 | |
433. add_float $4 += $5 | |
434. copy_3_slots_unmasked $5..7 = $59..61 | |
435. copy_3_slots_unmasked $8..10 = $65..67 | |
436. mul_3_floats $5..7 *= $8..10 | |
437. add_float $6 += $7 | |
438. add_float $5 += $6 | |
439. copy_3_slots_unmasked $6..8 = $53..55 | |
440. copy_3_slots_unmasked $9..11 = $68..70 | |
441. mul_3_floats $6..8 *= $9..11 | |
442. add_float $7 += $8 | |
443. add_float $6 += $7 | |
444. copy_3_slots_unmasked $7..9 = $56..58 | |
445. copy_3_slots_unmasked $10..12 = $68..70 | |
446. mul_3_floats $7..9 *= $10..12 | |
447. add_float $8 += $9 | |
448. add_float $7 += $8 | |
449. copy_3_slots_unmasked $8..10 = $59..61 | |
450. copy_3_slots_unmasked $11..13 = $68..70 | |
451. mul_3_floats $8..10 *= $11..13 | |
452. add_float $9 += $10 | |
453. add_float $8 += $9 | |
454. copy_4_slots_unmasked _8_m(0..3) = $0..3 | |
455. copy_4_slots_unmasked _8_m(4..7) = $4..7 | |
456. copy_slot_unmasked _8_m(8) = $8 | |
457. copy_slot_unmasked $0 = _0_ok | |
458. copy_4_slots_unmasked $1..4 = _8_m(0..3) | |
459. copy_4_slots_unmasked $5..8 = _8_m(4..7) | |
460. copy_slot_unmasked $9 = _8_m(8) | |
461. copy_constant $10 = 0x43020000 (130.0) | |
462. copy_constant $11 = 0x424C0000 (51.0) | |
463. copy_constant $12 = 0x420C0000 (35.0) | |
464. copy_constant $13 = 0x42F00000 (120.0) | |
465. copy_constant $14 = 0x423C0000 (47.0) | |
466. copy_constant $15 = 0x42040000 (33.0) | |
467. copy_constant $16 = 0x43700000 (240.0) | |
468. copy_constant $17 = 0x42920000 (73.0) | |
469. copy_constant $18 = 0x42340000 (45.0) | |
470. cmpeq_n_floats $1..9 = equal($1..9, $10..18) | |
471. bitwise_and_4_ints $2..5 &= $6..9 | |
472. bitwise_and_2_ints $2..3 &= $4..5 | |
473. bitwise_and_int $2 &= $3 | |
474. bitwise_and_int $1 &= $2 | |
475. bitwise_and_int $0 &= $1 | |
476. copy_slot_unmasked _0_ok = $0 | |
477. store_condition_mask $53 = CondMask | |
478. store_condition_mask $33 = CondMask | |
479. copy_slot_unmasked $34 = _0_ok | |
480. zero_slot_unmasked $54 = 0 | |
481. merge_condition_mask CondMask = $33 & $34 | |
482. branch_if_no_active_lanes branch_if_no_active_lanes +478 (#960) | |
483. copy_constant ok = 0xFFFFFFFF | |
484. copy_constant splat_4(0) = 0x40800000 (4.0) | |
485. copy_constant splat_4(1) = 0x40800000 (4.0) | |
486. copy_constant splat_4(2) = 0x40800000 (4.0) | |
487. copy_constant splat_4(3) = 0x40800000 (4.0) | |
488. copy_constant splat_4(4) = 0x40800000 (4.0) | |
489. copy_constant splat_4(5) = 0x40800000 (4.0) | |
490. copy_constant splat_4(6) = 0x40800000 (4.0) | |
491. copy_constant splat_4(7) = 0x40800000 (4.0) | |
492. copy_constant splat_4(8) = 0x40800000 (4.0) | |
493. copy_constant splat_2(0) = 0x40000000 (2.0) | |
494. copy_constant splat_2(1) = 0x40000000 (2.0) | |
495. copy_constant splat_2(2) = 0x40000000 (2.0) | |
496. copy_constant splat_2(3) = 0x40000000 (2.0) | |
497. copy_constant splat_2(4) = 0x40000000 (2.0) | |
498. copy_constant splat_2(5) = 0x40000000 (2.0) | |
499. copy_constant splat_2(6) = 0x40000000 (2.0) | |
500. copy_constant splat_2(7) = 0x40000000 (2.0) | |
501. copy_constant splat_2(8) = 0x40000000 (2.0) | |
502. stack_rewind | |
503. zero_4_slots_unmasked m(0..3) = 0 | |
504. zero_4_slots_unmasked m(4..7) = 0 | |
505. zero_slot_unmasked m(8) = 0 | |
506. zero_slot_unmasked $55 = 0 | |
507. copy_constant $56 = 0x40000000 (2.0) | |
508. shuffle $55..63 = ($55..63)[1 0 0 0 1 0 0 0 1] | |
509. copy_4_slots_masked m(0..3) = Mask($55..58) | |
510. copy_4_slots_masked m(4..7) = Mask($59..62) | |
511. copy_slot_masked m(8) = Mask($63) | |
512. copy_4_slots_unmasked $55..58 = m(0..3) | |
513. copy_4_slots_unmasked $59..62 = m(4..7) | |
514. copy_slot_unmasked $63 = m(8) | |
515. copy_4_slots_unmasked $64..67 = splat_4(0..3) | |
516. copy_4_slots_unmasked $68..71 = splat_4(4..7) | |
517. copy_slot_unmasked $72 = splat_4(8) | |
518. add_n_floats $55..63 += $64..72 | |
519. copy_4_slots_masked m(0..3) = Mask($55..58) | |
520. copy_4_slots_masked m(4..7) = Mask($59..62) | |
521. copy_slot_masked m(8) = Mask($63) | |
522. copy_slot_unmasked $55 = ok | |
523. copy_4_slots_unmasked $56..59 = m(0..3) | |
524. copy_4_slots_unmasked $60..63 = m(4..7) | |
525. copy_slot_unmasked $64 = m(8) | |
526. copy_constant $65 = 0x40C00000 (6.0) | |
527. copy_constant $66 = 0x40800000 (4.0) | |
528. copy_constant $67 = 0x40800000 (4.0) | |
529. copy_constant $68 = 0x40800000 (4.0) | |
530. copy_constant $69 = 0x40C00000 (6.0) | |
531. copy_constant $70 = 0x40800000 (4.0) | |
532. copy_constant $71 = 0x40800000 (4.0) | |
533. copy_constant $72 = 0x40800000 (4.0) | |
534. copy_constant $73 = 0x40C00000 (6.0) | |
535. cmpeq_n_floats $56..64 = equal($56..64, $65..73) | |
536. bitwise_and_4_ints $57..60 &= $61..64 | |
537. bitwise_and_2_ints $57..58 &= $59..60 | |
538. bitwise_and_int $57 &= $58 | |
539. bitwise_and_int $56 &= $57 | |
540. bitwise_and_int $55 &= $56 | |
541. copy_slot_masked ok = Mask($55) | |
542. zero_slot_unmasked $55 = 0 | |
543. copy_constant $56 = 0x40000000 (2.0) | |
544. shuffle $55..63 = ($55..63)[1 0 0 0 1 0 0 0 1] | |
545. copy_4_slots_masked m(0..3) = Mask($55..58) | |
546. copy_4_slots_masked m(4..7) = Mask($59..62) | |
547. copy_slot_masked m(8) = Mask($63) | |
548. copy_4_slots_unmasked $55..58 = m(0..3) | |
549. copy_4_slots_unmasked $59..62 = m(4..7) | |
550. copy_slot_unmasked $63 = m(8) | |
551. copy_4_slots_unmasked $64..67 = splat_4(0..3) | |
552. copy_4_slots_unmasked $68..71 = splat_4(4..7) | |
553. copy_slot_unmasked $72 = splat_4(8) | |
554. sub_n_floats $55..63 -= $64..72 | |
555. copy_4_slots_masked m(0..3) = Mask($55..58) | |
556. copy_4_slots_masked m(4..7) = Mask($59..62) | |
557. copy_slot_masked m(8) = Mask($63) | |
558. copy_slot_unmasked $55 = ok | |
559. copy_4_slots_unmasked $56..59 = m(0..3) | |
560. copy_4_slots_unmasked $60..63 = m(4..7) | |
561. copy_slot_unmasked $64 = m(8) | |
562. copy_constant $65 = 0xC0000000 (-2.0) | |
563. copy_constant $66 = 0xC0800000 (-4.0) | |
564. copy_constant $67 = 0xC0800000 (-4.0) | |
565. copy_constant $68 = 0xC0800000 (-4.0) | |
566. copy_constant $69 = 0xC0000000 (-2.0) | |
567. copy_constant $70 = 0xC0800000 (-4.0) | |
568. copy_constant $71 = 0xC0800000 (-4.0) | |
569. copy_constant $72 = 0xC0800000 (-4.0) | |
570. copy_constant $73 = 0xC0000000 (-2.0) | |
571. cmpeq_n_floats $56..64 = equal($56..64, $65..73) | |
572. bitwise_and_4_ints $57..60 &= $61..64 | |
573. bitwise_and_2_ints $57..58 &= $59..60 | |
574. bitwise_and_int $57 &= $58 | |
575. bitwise_and_int $56 &= $57 | |
576. bitwise_and_int $55 &= $56 | |
577. copy_slot_masked ok = Mask($55) | |
578. zero_slot_unmasked $55 = 0 | |
579. copy_constant $56 = 0x40000000 (2.0) | |
580. shuffle $55..63 = ($55..63)[1 0 0 0 1 0 0 0 1] | |
581. copy_4_slots_masked m(0..3) = Mask($55..58) | |
582. copy_4_slots_masked m(4..7) = Mask($59..62) | |
583. copy_slot_masked m(8) = Mask($63) | |
584. copy_4_slots_unmasked $55..58 = m(0..3) | |
585. copy_4_slots_unmasked $59..62 = m(4..7) | |
586. copy_slot_unmasked $63 = m(8) | |
587. copy_4_slots_unmasked $64..67 = splat_4(0..3) | |
588. copy_4_slots_unmasked $68..71 = splat_4(4..7) | |
589. copy_slot_unmasked $72 = splat_4(8) | |
590. div_n_floats $55..63 /= $64..72 | |
591. copy_4_slots_masked m(0..3) = Mask($55..58) | |
592. copy_4_slots_masked m(4..7) = Mask($59..62) | |
593. copy_slot_masked m(8) = Mask($63) | |
594. copy_slot_unmasked $55 = ok | |
595. copy_4_slots_unmasked $56..59 = m(0..3) | |
596. copy_4_slots_unmasked $60..63 = m(4..7) | |
597. copy_slot_unmasked $64 = m(8) | |
598. zero_slot_unmasked $65 = 0 | |
599. copy_constant $66 = 0x3F000000 (0.5) | |
600. shuffle $65..73 = ($65..73)[1 0 0 0 1 0 0 0 1] | |
601. cmpeq_n_floats $56..64 = equal($56..64, $65..73) | |
602. bitwise_and_4_ints $57..60 &= $61..64 | |
603. bitwise_and_2_ints $57..58 &= $59..60 | |
604. bitwise_and_int $57 &= $58 | |
605. bitwise_and_int $56 &= $57 | |
606. bitwise_and_int $55 &= $56 | |
607. copy_slot_masked ok = Mask($55) | |
608. copy_4_slots_unmasked $55..58 = splat_4(0..3) | |
609. copy_4_slots_unmasked $59..62 = splat_4(4..7) | |
610. copy_slot_unmasked $63 = splat_4(8) | |
611. copy_4_slots_masked m(0..3) = Mask($55..58) | |
612. copy_4_slots_masked m(4..7) = Mask($59..62) | |
613. copy_slot_masked m(8) = Mask($63) | |
614. copy_4_slots_unmasked $55..58 = m(0..3) | |
615. copy_4_slots_unmasked $59..62 = m(4..7) | |
616. copy_slot_unmasked $63 = m(8) | |
617. zero_slot_unmasked $64 = 0 | |
618. copy_constant $65 = 0x40000000 (2.0) | |
619. shuffle $64..72 = ($64..72)[1 0 0 0 1 0 0 0 1] | |
620. add_n_floats $55..63 += $64..72 | |
621. copy_4_slots_masked m(0..3) = Mask($55..58) | |
622. copy_4_slots_masked m(4..7) = Mask($59..62) | |
623. copy_slot_masked m(8) = Mask($63) | |
624. copy_slot_unmasked $55 = ok | |
625. copy_4_slots_unmasked $56..59 = m(0..3) | |
626. copy_4_slots_unmasked $60..63 = m(4..7) | |
627. copy_slot_unmasked $64 = m(8) | |
628. copy_constant $65 = 0x40C00000 (6.0) | |
629. copy_constant $66 = 0x40800000 (4.0) | |
630. copy_constant $67 = 0x40800000 (4.0) | |
631. copy_constant $68 = 0x40800000 (4.0) | |
632. copy_constant $69 = 0x40C00000 (6.0) | |
633. copy_constant $70 = 0x40800000 (4.0) | |
634. copy_constant $71 = 0x40800000 (4.0) | |
635. copy_constant $72 = 0x40800000 (4.0) | |
636. copy_constant $73 = 0x40C00000 (6.0) | |
637. cmpeq_n_floats $56..64 = equal($56..64, $65..73) | |
638. bitwise_and_4_ints $57..60 &= $61..64 | |
639. bitwise_and_2_ints $57..58 &= $59..60 | |
640. bitwise_and_int $57 &= $58 | |
641. bitwise_and_int $56 &= $57 | |
642. bitwise_and_int $55 &= $56 | |
643. copy_slot_masked ok = Mask($55) | |
644. copy_4_slots_unmasked $55..58 = splat_4(0..3) | |
645. copy_4_slots_unmasked $59..62 = splat_4(4..7) | |
646. copy_slot_unmasked $63 = splat_4(8) | |
647. copy_4_slots_masked m(0..3) = Mask($55..58) | |
648. copy_4_slots_masked m(4..7) = Mask($59..62) | |
649. copy_slot_masked m(8) = Mask($63) | |
650. copy_4_slots_unmasked $55..58 = m(0..3) | |
651. copy_4_slots_unmasked $59..62 = m(4..7) | |
652. copy_slot_unmasked $63 = m(8) | |
653. zero_slot_unmasked $64 = 0 | |
654. copy_constant $65 = 0x40000000 (2.0) | |
655. shuffle $64..72 = ($64..72)[1 0 0 0 1 0 0 0 1] | |
656. sub_n_floats $55..63 -= $64..72 | |
657. copy_4_slots_masked m(0..3) = Mask($55..58) | |
658. copy_4_slots_masked m(4..7) = Mask($59..62) | |
659. copy_slot_masked m(8) = Mask($63) | |
660. copy_slot_unmasked $55 = ok | |
661. copy_4_slots_unmasked $56..59 = m(0..3) | |
662. copy_4_slots_unmasked $60..63 = m(4..7) | |
663. copy_slot_unmasked $64 = m(8) | |
664. copy_constant $65 = 0x40000000 (2.0) | |
665. copy_constant $66 = 0x40800000 (4.0) | |
666. copy_constant $67 = 0x40800000 (4.0) | |
667. copy_constant $68 = 0x40800000 (4.0) | |
668. copy_constant $69 = 0x40000000 (2.0) | |
669. copy_constant $70 = 0x40800000 (4.0) | |
670. copy_constant $71 = 0x40800000 (4.0) | |
671. copy_constant $72 = 0x40800000 (4.0) | |
672. copy_constant $73 = 0x40000000 (2.0) | |
673. cmpeq_n_floats $56..64 = equal($56..64, $65..73) | |
674. bitwise_and_4_ints $57..60 &= $61..64 | |
675. bitwise_and_2_ints $57..58 &= $59..60 | |
676. bitwise_and_int $57 &= $58 | |
677. bitwise_and_int $56 &= $57 | |
678. bitwise_and_int $55 &= $56 | |
679. copy_slot_masked ok = Mask($55) | |
680. copy_4_slots_unmasked $55..58 = splat_4(0..3) | |
681. copy_4_slots_unmasked $59..62 = splat_4(4..7) | |
682. copy_slot_unmasked $63 = splat_4(8) | |
683. copy_4_slots_masked m(0..3) = Mask($55..58) | |
684. copy_4_slots_masked m(4..7) = Mask($59..62) | |
685. copy_slot_masked m(8) = Mask($63) | |
686. copy_4_slots_unmasked $55..58 = m(0..3) | |
687. copy_4_slots_unmasked $59..62 = m(4..7) | |
688. copy_slot_unmasked $63 = m(8) | |
689. copy_4_slots_unmasked $64..67 = splat_2(0..3) | |
690. copy_4_slots_unmasked $68..71 = splat_2(4..7) | |
691. copy_slot_unmasked $72 = splat_2(8) | |
692. div_n_floats $55..63 /= $64..72 | |
693. copy_4_slots_masked m(0..3) = Mask($55..58) | |
694. copy_4_slots_masked m(4..7) = Mask($59..62) | |
695. copy_slot_masked m(8) = Mask($63) | |
696. copy_slot_unmasked $55 = ok | |
697. copy_4_slots_unmasked $56..59 = m(0..3) | |
698. copy_4_slots_unmasked $60..63 = m(4..7) | |
699. copy_slot_unmasked $64 = m(8) | |
700. copy_constant $65 = 0x40000000 (2.0) | |
701. copy_constant $66 = 0x40000000 (2.0) | |
702. copy_constant $67 = 0x40000000 (2.0) | |
703. copy_constant $68 = 0x40000000 (2.0) | |
704. copy_constant $69 = 0x40000000 (2.0) | |
705. copy_constant $70 = 0x40000000 (2.0) | |
706. copy_constant $71 = 0x40000000 (2.0) | |
707. copy_constant $72 = 0x40000000 (2.0) | |
708. copy_constant $73 = 0x40000000 (2.0) | |
709. cmpeq_n_floats $56..64 = equal($56..64, $65..73) | |
710. bitwise_and_4_ints $57..60 &= $61..64 | |
711. bitwise_and_2_ints $57..58 &= $59..60 | |
712. bitwise_and_int $57 &= $58 | |
713. bitwise_and_int $56 &= $57 | |
714. bitwise_and_int $55 &= $56 | |
715. copy_slot_masked ok = Mask($55) | |
716. copy_constant m(0) = 0x3F800000 (1.0) | |
717. copy_constant m(1) = 0x40000000 (2.0) | |
718. copy_constant m(2) = 0x40400000 (3.0) | |
719. copy_constant m(3) = 0x40800000 (4.0) | |
720. copy_constant m(4) = 0x40A00000 (5.0) | |
721. copy_constant m(5) = 0x40C00000 (6.0) | |
722. copy_constant m(6) = 0x40E00000 (7.0) | |
723. copy_constant m(7) = 0x41000000 (8.0) | |
724. copy_constant m(8) = 0x41100000 (9.0) | |
725. copy_constant m(9) = 0x41200000 (10.0) | |
726. copy_constant m(10) = 0x41300000 (11.0) | |
727. copy_constant m(11) = 0x41400000 (12.0) | |
728. copy_constant m(12) = 0x41500000 (13.0) | |
729. copy_constant m(13) = 0x41600000 (14.0) | |
730. copy_constant m(14) = 0x41700000 (15.0) | |
731. copy_constant m(15) = 0x41800000 (16.0) | |
732. copy_4_slots_unmasked $55..58 = m(0..3) | |
733. copy_4_slots_unmasked $59..62 = m(4..7) | |
734. copy_4_slots_unmasked $63..66 = m(8..11) | |
735. copy_4_slots_unmasked $67..70 = m(12..15) | |
736. copy_constant $71 = 0x41800000 (16.0) | |
737. copy_constant $72 = 0x41700000 (15.0) | |
738. copy_constant $73 = 0x41600000 (14.0) | |
739. copy_constant $74 = 0x41500000 (13.0) | |
740. copy_constant $75 = 0x41400000 (12.0) | |
741. copy_constant $76 = 0x41300000 (11.0) | |
742. copy_constant $77 = 0x41200000 (10.0) | |
743. copy_constant $78 = 0x41100000 (9.0) | |
744. copy_constant $79 = 0x41000000 (8.0) | |
745. copy_constant $80 = 0x40E00000 (7.0) | |
746. copy_constant $81 = 0x40C00000 (6.0) | |
747. copy_constant $82 = 0x40A00000 (5.0) | |
748. copy_constant $83 = 0x40800000 (4.0) | |
749. copy_constant $84 = 0x40400000 (3.0) | |
750. copy_constant $85 = 0x40000000 (2.0) | |
751. copy_constant $86 = 0x3F800000 (1.0) | |
752. add_n_floats $55..70 += $71..86 | |
753. copy_4_slots_masked m(0..3) = Mask($55..58) | |
754. copy_4_slots_masked m(4..7) = Mask($59..62) | |
755. copy_4_slots_masked m(8..11) = Mask($63..66) | |
756. copy_4_slots_masked m(12..15) = Mask($67..70) | |
757. copy_slot_unmasked $55 = ok | |
758. copy_4_slots_unmasked $56..59 = m(0..3) | |
759. copy_4_slots_unmasked $60..63 = m(4..7) | |
760. copy_4_slots_unmasked $64..67 = m(8..11) | |
761. copy_4_slots_unmasked $68..71 = m(12..15) | |
762. copy_constant $72 = 0x41880000 (17.0) | |
763. copy_constant $73 = 0x41880000 (17.0) | |
764. copy_constant $74 = 0x41880000 (17.0) | |
765. copy_constant $75 = 0x41880000 (17.0) | |
766. copy_constant $76 = 0x41880000 (17.0) | |
767. copy_constant $77 = 0x41880000 (17.0) | |
768. copy_constant $78 = 0x41880000 (17.0) | |
769. copy_constant $79 = 0x41880000 (17.0) | |
770. copy_constant $80 = 0x41880000 (17.0) | |
771. copy_constant $81 = 0x41880000 (17.0) | |
772. copy_constant $82 = 0x41880000 (17.0) | |
773. copy_constant $83 = 0x41880000 (17.0) | |
774. copy_constant $84 = 0x41880000 (17.0) | |
775. copy_constant $85 = 0x41880000 (17.0) | |
776. copy_constant $86 = 0x41880000 (17.0) | |
777. copy_constant $87 = 0x41880000 (17.0) | |
778. cmpeq_n_floats $56..71 = equal($56..71, $72..87) | |
779. bitwise_and_4_ints $64..67 &= $68..71 | |
780. bitwise_and_4_ints $60..63 &= $64..67 | |
781. bitwise_and_4_ints $56..59 &= $60..63 | |
782. bitwise_and_2_ints $56..57 &= $58..59 | |
783. bitwise_and_int $56 &= $57 | |
784. bitwise_and_int $55 &= $56 | |
785. copy_slot_masked ok = Mask($55) | |
786. copy_constant m(0) = 0x41200000 (10.0) | |
787. copy_constant m(1) = 0x41A00000 (20.0) | |
788. copy_constant m(2) = 0x41F00000 (30.0) | |
789. copy_constant m(3) = 0x42200000 (40.0) | |
790. copy_4_slots_unmasked $55..58 = m | |
791. copy_constant $59 = 0x3F800000 (1.0) | |
792. copy_constant $60 = 0x40000000 (2.0) | |
793. copy_constant $61 = 0x40400000 (3.0) | |
794. copy_constant $62 = 0x40800000 (4.0) | |
795. sub_4_floats $55..58 -= $59..62 | |
796. copy_4_slots_masked m = Mask($55..58) | |
797. copy_slot_unmasked $55 = ok | |
798. copy_4_slots_unmasked $56..59 = m | |
799. copy_constant $60 = 0x41100000 (9.0) | |
800. copy_constant $61 = 0x41900000 (18.0) | |
801. copy_constant $62 = 0x41D80000 (27.0) | |
802. copy_constant $63 = 0x42100000 (36.0) | |
803. cmpeq_4_floats $56..59 = equal($56..59, $60..63) | |
804. bitwise_and_2_ints $56..57 &= $58..59 | |
805. bitwise_and_int $56 &= $57 | |
806. bitwise_and_int $55 &= $56 | |
807. copy_slot_masked ok = Mask($55) | |
808. copy_constant m(0) = 0x40000000 (2.0) | |
809. copy_constant m(1) = 0x40800000 (4.0) | |
810. copy_constant m(2) = 0x40C00000 (6.0) | |
811. copy_constant m(3) = 0x41000000 (8.0) | |
812. copy_4_slots_unmasked $55..58 = m | |
813. copy_constant $59 = 0x40000000 (2.0) | |
814. copy_constant $60 = 0x40000000 (2.0) | |
815. copy_constant $61 = 0x40000000 (2.0) | |
816. copy_constant $62 = 0x40800000 (4.0) | |
817. div_4_floats $55..58 /= $59..62 | |
818. copy_4_slots_masked m = Mask($55..58) | |
819. copy_slot_unmasked $55 = ok | |
820. copy_4_slots_unmasked $56..59 = m | |
821. copy_constant $60 = 0x3F800000 (1.0) | |
822. copy_constant $61 = 0x40000000 (2.0) | |
823. copy_constant $62 = 0x40400000 (3.0) | |
824. copy_constant $63 = 0x40000000 (2.0) | |
825. cmpeq_4_floats $56..59 = equal($56..59, $60..63) | |
826. bitwise_and_2_ints $56..57 &= $58..59 | |
827. bitwise_and_int $56 &= $57 | |
828. bitwise_and_int $55 &= $56 | |
829. copy_slot_masked ok = Mask($55) | |
830. copy_constant m(0) = 0x3F800000 (1.0) | |
831. copy_constant m(1) = 0x40000000 (2.0) | |
832. copy_constant m(2) = 0x40E00000 (7.0) | |
833. copy_constant m(3) = 0x40800000 (4.0) | |
834. copy_4_slots_unmasked $35..38 = m | |
835. swizzle_3 $36..38 = ($36..38).yxz | |
836. copy_constant $39 = 0x40400000 (3.0) | |
837. copy_constant $40 = 0x40A00000 (5.0) | |
838. copy_constant $41 = 0x40400000 (3.0) | |
839. copy_constant $42 = 0x40000000 (2.0) | |
840. copy_2_slots_unmasked $55..56 = $35..36 | |
841. copy_2_slots_unmasked $57..58 = $39..40 | |
842. mul_2_floats $55..56 *= $57..58 | |
843. add_float $55 += $56 | |
844. copy_2_slots_unmasked $56..57 = $37..38 | |
845. copy_2_slots_unmasked $58..59 = $39..40 | |
846. mul_2_floats $56..57 *= $58..59 | |
847. add_float $56 += $57 | |
848. copy_2_slots_unmasked $57..58 = $35..36 | |
849. copy_2_slots_unmasked $59..60 = $41..42 | |
850. mul_2_floats $57..58 *= $59..60 | |
851. add_float $57 += $58 | |
852. copy_2_slots_unmasked $58..59 = $37..38 | |
853. copy_2_slots_unmasked $60..61 = $41..42 | |
854. mul_2_floats $58..59 *= $60..61 | |
855. add_float $58 += $59 | |
856. copy_4_slots_masked m = Mask($55..58) | |
857. copy_slot_unmasked $55 = ok | |
858. copy_4_slots_unmasked $56..59 = m | |
859. copy_constant $60 = 0x42180000 (38.0) | |
860. copy_constant $61 = 0x41D00000 (26.0) | |
861. copy_constant $62 = 0x41880000 (17.0) | |
862. copy_constant $63 = 0x41600000 (14.0) | |
863. cmpeq_4_floats $56..59 = equal($56..59, $60..63) | |
864. bitwise_and_2_ints $56..57 &= $58..59 | |
865. bitwise_and_int $56 &= $57 | |
866. bitwise_and_int $55 &= $56 | |
867. copy_slot_masked ok = Mask($55) | |
868. copy_constant m(0) = 0x41200000 (10.0) | |
869. copy_constant m(1) = 0x40800000 (4.0) | |
870. copy_constant m(2) = 0x40000000 (2.0) | |
871. copy_constant m(3) = 0x41A00000 (20.0) | |
872. copy_constant m(4) = 0x40A00000 (5.0) | |
873. copy_constant m(5) = 0x40400000 (3.0) | |
874. copy_constant m(6) = 0x41200000 (10.0) | |
875. copy_constant m(7) = 0x40C00000 (6.0) | |
876. copy_constant m(8) = 0x40A00000 (5.0) | |
877. copy_4_slots_unmasked $35..38 = m(0..3) | |
878. copy_4_slots_unmasked $39..42 = m(4..7) | |
879. copy_slot_unmasked $43 = m(8) | |
880. shuffle $36..43 = ($36..43)[2 5 0 3 6 1 4 7] | |
881. copy_constant $44 = 0x40400000 (3.0) | |
882. copy_constant $45 = 0x40400000 (3.0) | |
883. copy_constant $46 = 0x40800000 (4.0) | |
884. copy_constant $47 = 0x40000000 (2.0) | |
885. copy_constant $48 = 0x40400000 (3.0) | |
886. copy_constant $49 = 0x40800000 (4.0) | |
887. copy_constant $50 = 0x40800000 (4.0) | |
888. copy_constant $51 = 0x41100000 (9.0) | |
889. copy_constant $52 = 0x40000000 (2.0) | |
890. copy_3_slots_unmasked $55..57 = $35..37 | |
891. copy_3_slots_unmasked $58..60 = $44..46 | |
892. mul_3_floats $55..57 *= $58..60 | |
893. add_float $56 += $57 | |
894. add_float $55 += $56 | |
895. copy_3_slots_unmasked $56..58 = $38..40 | |
896. copy_3_slots_unmasked $59..61 = $44..46 | |
897. mul_3_floats $56..58 *= $59..61 | |
898. add_float $57 += $58 | |
899. add_float $56 += $57 | |
900. copy_3_slots_unmasked $57..59 = $41..43 | |
901. copy_3_slots_unmasked $60..62 = $44..46 | |
902. mul_3_floats $57..59 *= $60..62 | |
903. add_float $58 += $59 | |
904. add_float $57 += $58 | |
905. copy_3_slots_unmasked $58..60 = $35..37 | |
906. copy_3_slots_unmasked $61..63 = $47..49 | |
907. mul_3_floats $58..60 *= $61..63 | |
908. add_float $59 += $60 | |
909. add_float $58 += $59 | |
910. copy_3_slots_unmasked $59..61 = $38..40 | |
911. copy_3_slots_unmasked $62..64 = $47..49 | |
912. mul_3_floats $59..61 *= $62..64 | |
913. add_float $60 += $61 | |
914. add_float $59 += $60 | |
915. copy_3_slots_unmasked $60..62 = $41..43 | |
916. copy_3_slots_unmasked $63..65 = $47..49 | |
917. mul_3_floats $60..62 *= $63..65 | |
918. add_float $61 += $62 | |
919. add_float $60 += $61 | |
920. copy_3_slots_unmasked $61..63 = $35..37 | |
921. copy_3_slots_unmasked $64..66 = $50..52 | |
922. mul_3_floats $61..63 *= $64..66 | |
923. add_float $62 += $63 | |
924. add_float $61 += $62 | |
925. copy_3_slots_unmasked $62..64 = $38..40 | |
926. copy_3_slots_unmasked $65..67 = $50..52 | |
927. mul_3_floats $62..64 *= $65..67 | |
928. add_float $63 += $64 | |
929. add_float $62 += $63 | |
930. copy_3_slots_unmasked $63..65 = $41..43 | |
931. copy_3_slots_unmasked $66..68 = $50..52 | |
932. mul_3_floats $63..65 *= $66..68 | |
933. add_float $64 += $65 | |
934. add_float $63 += $64 | |
935. copy_4_slots_masked m(0..3) = Mask($55..58) | |
936. copy_4_slots_masked m(4..7) = Mask($59..62) | |
937. copy_slot_masked m(8) = Mask($63) | |
938. copy_slot_unmasked $55 = ok | |
939. copy_4_slots_unmasked $56..59 = m(0..3) | |
940. copy_4_slots_unmasked $60..63 = m(4..7) | |
941. copy_slot_unmasked $64 = m(8) | |
942. copy_constant $65 = 0x43020000 (130.0) | |
943. copy_constant $66 = 0x424C0000 (51.0) | |
944. copy_constant $67 = 0x420C0000 (35.0) | |
945. copy_constant $68 = 0x42F00000 (120.0) | |
946. copy_constant $69 = 0x423C0000 (47.0) | |
947. copy_constant $70 = 0x42040000 (33.0) | |
948. copy_constant $71 = 0x43700000 (240.0) | |
949. copy_constant $72 = 0x42920000 (73.0) | |
950. copy_constant $73 = 0x42340000 (45.0) | |
951. cmpeq_n_floats $56..64 = equal($56..64, $65..73) | |
952. bitwise_and_4_ints $57..60 &= $61..64 | |
953. bitwise_and_2_ints $57..58 &= $59..60 | |
954. bitwise_and_int $57 &= $58 | |
955. bitwise_and_int $56 &= $57 | |
956. bitwise_and_int $55 &= $56 | |
957. copy_slot_masked ok = Mask($55) | |
958. copy_slot_masked [test_matrix_op_matrix_half].result = Mask($55) | |
959. copy_slot_masked $54 = Mask($55) | |
960. load_condition_mask CondMask = $33 | |
961. copy_4_constants $0..3 = colorRed | |
962. merge_condition_mask CondMask = $53 & $54 | |
963. copy_4_constants $4..7 = colorGreen | |
964. copy_4_slots_masked $0..3 = Mask($4..7) | |
965. load_condition_mask CondMask = $53 | |
966. copy_4_slots_unmasked [main].result = $0..3 | |
967. load_src src.rgba = [main].result |