Lines Matching refs:dw

54    uint32_t dw;
132 return ((union __intel_value) { .f = (v) }).dw;
429 uint32_t * restrict dw = (uint32_t * restrict) dst;
431 dw[0] =
435 dw[1] =
440 __gen_address(data, &dw[2], values->Buffer[0], 0, 5, 63);
441 dw[2] = v2_address;
442 dw[3] = v2_address >> 32;
445 __gen_address(data, &dw[4], values->Buffer[1], 0, 5, 63);
446 dw[4] = v4_address;
447 dw[5] = v4_address >> 32;
450 __gen_address(data, &dw[6], values->Buffer[2], 0, 5, 63);
451 dw[6] = v6_address;
452 dw[7] = v6_address >> 32;
455 __gen_address(data, &dw[8], values->Buffer[3], 0, 5, 63);
456 dw[8] = v8_address;
457 dw[9] = v8_address >> 32;
471 uint32_t * restrict dw = (uint32_t * restrict) dst;
473 dw[0] =
488 uint32_t * restrict dw = (uint32_t * restrict) dst;
490 dw[0] =
523 uint32_t * restrict dw = (uint32_t * restrict) dst;
525 dw[0] =
538 dw[1] =
566 uint32_t * restrict dw = (uint32_t * restrict) dst;
568 dw[0] =
591 uint32_t * restrict dw = (uint32_t * restrict) dst;
593 dw[0] =
596 dw[1] =
619 uint32_t * restrict dw = (uint32_t * restrict) dst;
621 dw[0] =
625 dw[1] =
629 dw[2] =
632 dw[3] =
635 dw[4] =
638 dw[5] =
656 uint32_t * restrict dw = (uint32_t * restrict) dst;
658 dw[0] =
674 uint32_t * restrict dw = (uint32_t * restrict) dst;
676 dw[0] =
690 uint32_t * restrict dw = (uint32_t * restrict) dst;
692 dw[0] =
698 dw[1] =
715 uint32_t * restrict dw = (uint32_t * restrict) dst;
717 dw[0] =
723 dw[1] =
742 uint32_t * restrict dw = (uint32_t * restrict) dst;
744 dw[0] =
773 uint32_t * restrict dw = (uint32_t * restrict) dst;
775 dw[0] =
795 uint32_t * restrict dw = (uint32_t * restrict) dst;
797 dw[0] =
801 __gen_address(data, &dw[1], values->IndirectPayloadBaseAddress, 0, 0, 63);
802 dw[1] = v1_address;
803 dw[2] = v1_address >> 32;
805 GFX9_MEMORYADDRESSATTRIBUTES_pack(data, &dw[3], &values->IndirectPayloadBaseAddress2);
828 uint32_t * restrict dw = (uint32_t * restrict) dst;
830 dw[0] =
853 uint32_t * restrict dw = (uint32_t * restrict) dst;
855 dw[0] =
875 uint32_t * restrict dw = (uint32_t * restrict) dst;
877 dw[0] =
895 uint32_t * restrict dw = (uint32_t * restrict) dst;
897 dw[0] =
916 uint32_t * restrict dw = (uint32_t * restrict) dst;
918 dw[0] =
933 uint32_t * restrict dw = (uint32_t * restrict) dst;
935 dw[0] =
951 uint32_t * restrict dw = (uint32_t * restrict) dst;
954 __gen_address(data, &dw[0], values->Address, 0, 0, 63);
955 dw[0] = v0_address;
956 dw[1] = v0_address >> 32;
958 GFX9_MEMORYADDRESSATTRIBUTES_pack(data, &dw[2], &values->MemoryAddressAttributes);
1007 uint32_t * restrict dw = (uint32_t * restrict) dst;
1009 dw[0] =
1027 dw[1] =
1034 dw[2] =
1099 uint32_t * restrict dw = (uint32_t * restrict) dst;
1103 dw[0] = v0;
1104 dw[1] = v0 >> 32;
1106 dw[2] =
1115 dw[3] =
1119 dw[4] =
1123 dw[5] =
1127 dw[6] =
1134 dw[7] =
1158 uint32_t * restrict dw = (uint32_t * restrict) dst;
1160 dw[0] =
1170 dw[1] =
1242 uint32_t * restrict dw = (uint32_t * restrict) dst;
1244 dw[0] =
1263 uint32_t * restrict dw = (uint32_t * restrict) dst;
1265 dw[0] =
1391 uint32_t * restrict dw = (uint32_t * restrict) dst;
1393 dw[0] =
1412 dw[1] =
1417 dw[2] =
1421 dw[3] =
1425 dw[4] =
1433 dw[5] =
1443 dw[6] =
1451 dw[7] =
1461 __gen_address(data, &dw[8], values->SurfaceBaseAddress, 0, 0, 63);
1462 dw[8] = v8_address;
1463 dw[9] = v8_address >> 32;
1472 __gen_address(data, &dw[10], values->AuxiliarySurfaceBaseAddress, v10, 12, 63);
1473 dw[10] = v10_address;
1474 dw[11] = (v10_address >> 32) | (v10 >> 32);
1476 dw[12] =
1480 dw[13] =
1483 dw[14] =
1486 dw[15] =
1508 uint32_t * restrict dw = (uint32_t * restrict) dst;
1510 dw[0] =
1531 uint32_t * restrict dw = (uint32_t * restrict) dst;
1533 dw[0] =
1537 dw[1] =
1541 dw[2] =
1545 dw[3] =
1638 uint32_t * restrict dw = (uint32_t * restrict) dst;
1640 dw[0] =
1651 dw[1] =
1660 dw[2] =
1664 dw[3] =
1693 uint32_t * restrict dw = (uint32_t * restrict) dst;
1695 dw[0] =
1703 dw[1] =
1707 dw[2] =
1711 dw[3] =
1715 dw[4] = 0;
1717 dw[5] = 0;
1719 dw[6] = 0;
1721 dw[7] = 0;
1737 uint32_t * restrict dw = (uint32_t * restrict) dst;
1739 dw[0] =
1743 dw[1] =
1766 uint32_t * restrict dw = (uint32_t * restrict) dst;
1768 dw[0] =
1774 dw[1] =
1782 dw[2] = v2;
1783 dw[3] = v2 >> 32;
1787 dw[4] = v4;
1788 dw[5] = v4 >> 32;
1792 dw[6] = v6;
1793 dw[7] = v6 >> 32;
1797 dw[8] = v8;
1798 dw[9] = v8 >> 32;
1802 dw[10] = v10;
1803 dw[11] = v10 >> 32;
1807 dw[12] = v12;
1808 dw[13] = v12 >> 32;
1812 dw[14] = v14;
1813 dw[15] = v14 >> 32;
1817 dw[16] = v16;
1818 dw[17] = v16 >> 32;
1822 dw[18] = v18;
1823 dw[19] = v18 >> 32;
1827 dw[20] = v20;
1828 dw[21] = v20 >> 32;
1832 dw[22] = v22;
1833 dw[23] = v22 >> 32;
1837 dw[24] = v24;
1838 dw[25] = v24 >> 32;
1842 dw[26] = v26;
1843 dw[27] = v26 >> 32;
1847 dw[28] = v28;
1848 dw[29] = v28 >> 32;
1852 dw[30] = v30;
1853 dw[31] = v30 >> 32;
1857 dw[32] = v32;
1858 dw[33] = v32 >> 32;
1862 dw[34] = v34;
1863 dw[35] = v34 >> 32;
1867 dw[36] = v36;
1868 dw[37] = v36 >> 32;
1872 dw[38] = v38;
1873 dw[39] = v38 >> 32;
1877 dw[40] = v40;
1878 dw[41] = v40 >> 32;
1882 dw[42] = v42;
1883 dw[43] = v42 >> 32;
1887 dw[44] = v44;
1888 dw[45] = v44 >> 32;
1892 dw[46] = v46;
1893 dw[47] = v46 >> 32;
1897 dw[48] = v48;
1898 dw[49] = v48 >> 32;
1902 dw[50] = v50;
1903 dw[51] = v50 >> 32;
1907 dw[52] = v52;
1908 dw[53] = v52 >> 32;
1912 dw[54] = v54;
1913 dw[55] = v54 >> 32;
1917 dw[56] = v56;
1918 dw[57] = v56 >> 32;
1922 dw[58] = v58;
1923 dw[59] = v58 >> 32;
1927 dw[60] = v60;
1928 dw[61] = v60 >> 32;
1932 dw[62] = v62;
1933 dw[63] = v62 >> 32;
1962 uint32_t * restrict dw = (uint32_t * restrict) dst;
1964 dw[0] =
1970 dw[1] =
1976 dw[2] =
1982 dw[3] =
1990 dw[4] = v4;
1991 dw[5] = v4 >> 32;
1995 dw[8] = v8;
1996 dw[9] = v8 >> 32;
2000 dw[12] = v12;
2001 dw[13] = v12 >> 32;
2005 dw[16] = v16;
2006 dw[17] = v16 >> 32;
2010 dw[20] = v20;
2011 dw[21] = v20 >> 32;
2015 dw[24] = v24;
2016 dw[25] = v24 >> 32;
2020 dw[28] = v28;
2021 dw[29] = v28 >> 32;
2025 dw[32] = v32;
2026 dw[33] = v32 >> 32;
2030 dw[36] = v36;
2031 dw[37] = v36 >> 32;
2035 dw[40] = v40;
2036 dw[41] = v40 >> 32;
2040 dw[44] = v44;
2041 dw[45] = v44 >> 32;
2045 dw[48] = v48;
2046 dw[49] = v48 >> 32;
2050 dw[52] = v52;
2051 dw[53] = v52 >> 32;
2055 dw[56] = v56;
2056 dw[57] = v56 >> 32;
2060 dw[60] = v60;
2061 dw[61] = v60 >> 32;
2065 dw[64] = v64;
2066 dw[65] = v64 >> 32;
2070 dw[68] = v68;
2071 dw[69] = v68 >> 32;
2075 dw[72] = v72;
2076 dw[73] = v72 >> 32;
2080 dw[76] = v76;
2081 dw[77] = v76 >> 32;
2085 dw[80] = v80;
2086 dw[81] = v80 >> 32;
2090 dw[84] = v84;
2091 dw[85] = v84 >> 32;
2095 dw[88] = v88;
2096 dw[89] = v88 >> 32;
2100 dw[92] = v92;
2101 dw[93] = v92 >> 32;
2105 dw[96] = v96;
2106 dw[97] = v96 >> 32;
2110 dw[100] = v100;
2111 dw[101] = v100 >> 32;
2115 dw[104] = v104;
2116 dw[105] = v104 >> 32;
2120 dw[108] = v108;
2121 dw[109] = v108 >> 32;
2125 dw[112] = v112;
2126 dw[113] = v112 >> 32;
2130 dw[116] = v116;
2131 dw[117] = v116 >> 32;
2135 dw[120] = v120;
2136 dw[121] = v120 >> 32;
2140 dw[124] = v124;
2141 dw[125] = v124 >> 32;
2158 uint32_t * restrict dw = (uint32_t * restrict) dst;
2160 dw[0] =
2165 dw[1] =
2256 uint32_t * restrict dw = (uint32_t * restrict) dst;
2258 dw[0] =
2265 dw[1] =
2274 dw[2] =
2280 dw[3] =
2287 dw[4] =
2295 dw[5] =
2301 dw[6] =
2304 dw[7] =
2309 dw[8] =
2315 dw[9] =
2321 dw[10] =
2325 dw[11] =
2331 dw[12] =
2337 dw[13] =
2342 dw[14] =
2346 dw[15] =
2352 dw[16] =
2356 dw[17] =
2360 dw[18] =
2364 dw[19] =
2367 dw[20] =
2371 dw[21] =
2375 dw[22] =
2391 uint32_t * restrict dw = (uint32_t * restrict) dst;
2393 dw[0] =
2421 uint32_t * restrict dw = (uint32_t * restrict) dst;
2423 dw[0] =
2426 dw[1] =
2429 dw[2] =
2432 dw[3] =
2435 dw[4] =
2438 dw[5] =
2441 dw[6] = 0;
2443 dw[7] = 0;
2445 dw[8] =
2448 dw[9] =
2451 dw[10] =
2454 dw[11] =
2457 dw[12] =
2460 dw[13] =
2463 dw[14] =
2466 dw[15] =
2495 uint32_t * restrict dw = (uint32_t * restrict) dst;
2497 dw[0] =
2521 uint32_t * restrict dw = (uint32_t * restrict) dst;
2523 dw[0] =
2543 uint32_t * restrict dw = (uint32_t * restrict) dst;
2551 dw[0] =
2561 dw[1] =
2588 uint32_t * restrict dw = (uint32_t * restrict) dst;
2590 dw[0] =
2610 uint32_t * restrict dw = (uint32_t * restrict) dst;
2613 __gen_address(data, &dw[0], values->Address, 0, 0, 63);
2614 dw[0] = v0_address;
2615 dw[1] = v0_address >> 32;
2617 GFX9_VDENC_SURFACE_CONTROL_BITS_pack(data, &dw[2], &values->PictureFields);
2651 uint32_t * restrict dw = (uint32_t * restrict) dst;
2653 dw[0] =
2660 dw[1] =
2668 dw[2] =
2672 dw[3] =
2693 uint32_t * restrict dw = (uint32_t * restrict) dst;
2695 dw[0] =
2703 __gen_address(data, &dw[1], values->BufferStartingAddress, 0, 0, 63);
2704 dw[1] = v1_address;
2705 dw[2] = v1_address >> 32;
2707 dw[3] =
2729 uint32_t * restrict dw = (uint32_t * restrict) dst;
2731 dw[0] =
2738 dw[1] =
2780 uint32_t * restrict dw = (uint32_t * restrict) dst;
2782 dw[0] =
2792 dw[1] =
2797 dw[2] =
2800 dw[3] =
2803 dw[4] =
2806 dw[5] =
2809 dw[6] =
2843 uint32_t * restrict dw = (uint32_t * restrict) dst;
2845 dw[0] =
2852 dw[1] =
2858 dw[2] =
2892 uint32_t * restrict dw = (uint32_t * restrict) dst;
2894 dw[0] =
2901 dw[1] =
2933 uint32_t * restrict dw = (uint32_t * restrict) dst;
2935 dw[0] =
2942 dw[1] =
2974 uint32_t * restrict dw = (uint32_t * restrict) dst;
2976 dw[0] =
2983 dw[1] =
3015 uint32_t * restrict dw = (uint32_t * restrict) dst;
3017 dw[0] =
3024 dw[1] =
3056 uint32_t * restrict dw = (uint32_t * restrict) dst;
3058 dw[0] =
3065 dw[1] =
3093 uint32_t * restrict dw = (uint32_t * restrict) dst;
3095 dw[0] =
3102 dw[1] =
3129 uint32_t * restrict dw = (uint32_t * restrict) dst;
3131 dw[0] =
3138 dw[1] =
3165 uint32_t * restrict dw = (uint32_t * restrict) dst;
3167 dw[0] =
3174 dw[1] =
3201 uint32_t * restrict dw = (uint32_t * restrict) dst;
3203 dw[0] =
3210 dw[1] =
3237 uint32_t * restrict dw = (uint32_t * restrict) dst;
3239 dw[0] =
3246 dw[1] =
3277 uint32_t * restrict dw = (uint32_t * restrict) dst;
3279 dw[0] =
3290 __gen_address(data, &dw[1], values->BindingTablePoolBaseAddress, v1, 12, 63);
3291 dw[1] = v1_address;
3292 dw[2] = (v1_address >> 32) | (v1 >> 32);
3294 dw[3] =
3322 uint32_t * restrict dw = (uint32_t * restrict) dst;
3324 dw[0] =
3331 dw[1] =
3360 uint32_t * restrict dw = (uint32_t * restrict) dst;
3362 dw[0] =
3369 dw[1] =
3399 uint32_t * restrict dw = (uint32_t * restrict) dst;
3401 dw[0] =
3408 dw[1] =
3411 dw[2] =
3414 dw[3] =
3442 uint32_t * restrict dw = (uint32_t * restrict) dst;
3444 dw[0] =
3451 dw[1] =
3454 dw[2] =
3509 uint32_t * restrict dw = (uint32_t * restrict) dst;
3511 dw[0] =
3518 dw[1] =
3527 dw[2] =
3540 dw[3] =
3571 uint32_t * restrict dw = (uint32_t * restrict) dst;
3573 dw[0] =
3581 GFX9_3DSTATE_CONSTANT_BODY_pack(data, &dw[1], &values->ConstantBody);
3608 uint32_t * restrict dw = (uint32_t * restrict) dst;
3610 dw[0] =
3618 GFX9_3DSTATE_CONSTANT_BODY_pack(data, &dw[1], &values->ConstantBody);
3645 uint32_t * restrict dw = (uint32_t * restrict) dst;
3647 dw[0] =
3655 GFX9_3DSTATE_CONSTANT_BODY_pack(data, &dw[1], &values->ConstantBody);
3682 uint32_t * restrict dw = (uint32_t * restrict) dst;
3684 dw[0] =
3692 GFX9_3DSTATE_CONSTANT_BODY_pack(data, &dw[1], &values->ConstantBody);
3719 uint32_t * restrict dw = (uint32_t * restrict) dst;
3721 dw[0] =
3729 GFX9_3DSTATE_CONSTANT_BODY_pack(data, &dw[1], &values->ConstantBody);
3780 uint32_t * restrict dw = (uint32_t * restrict) dst;
3782 dw[0] =
3789 dw[1] =
3798 __gen_address(data, &dw[2], values->SurfaceBaseAddress, 0, 0, 63);
3799 dw[2] = v2_address;
3800 dw[3] = v2_address >> 32;
3802 dw[4] =
3807 dw[5] =
3812 dw[6] =
3816 dw[7] =
3853 uint32_t * restrict dw = (uint32_t * restrict) dst;
3855 dw[0] =
3863 dw[1] =
3867 dw[2] =
3871 dw[3] =
3934 uint32_t * restrict dw = (uint32_t * restrict) dst;
3936 dw[0] =
3945 dw[1] = v1;
3946 dw[2] = v1 >> 32;
3948 dw[3] =
3961 __gen_address(data, &dw[4], values->ScratchSpaceBasePointer, v4, 10, 63);
3962 dw[4] = v4_address;
3963 dw[5] = (v4_address >> 32) | (v4 >> 32);
3965 dw[6] =
3970 dw[7] =
3978 dw[8] =
3986 dw[9] = v9;
3987 dw[10] = v9 >> 32;
4022 uint32_t * restrict dw = (uint32_t * restrict) dst;
4024 dw[0] =
4031 dw[1] =
4036 dw[2] =
4074 uint32_t * restrict dw = (uint32_t * restrict) dst;
4076 dw[0] =
4083 dw[1] =
4088 dw[2] =
4126 uint32_t * restrict dw = (uint32_t * restrict) dst;
4128 dw[0] =
4135 dw[1] =
4140 dw[2] =
4180 uint32_t * restrict dw = (uint32_t * restrict) dst;
4182 dw[0] =
4189 dw[1] =
4195 dw[2] =
4236 uint32_t * restrict dw = (uint32_t * restrict) dst;
4238 dw[0] =
4245 dw[1] =
4251 dw[2] =
4284 uint32_t * restrict dw = (uint32_t * restrict) dst;
4286 dw[0] =
4297 __gen_address(data, &dw[1], values->GatherPoolBaseAddress, v1, 12, 63);
4298 dw[1] = v1_address;
4299 dw[2] = (v1_address >> 32) | (v1 >> 32);
4301 dw[3] =
4382 uint32_t * restrict dw = (uint32_t * restrict) dst;
4384 dw[0] =
4393 dw[1] = v1;
4394 dw[2] = v1 >> 32;
4396 dw[3] =
4412 __gen_address(data, &dw[4], values->ScratchSpaceBasePointer, v4, 10, 63);
4413 dw[4] = v4_address;
4414 dw[5] = (v4_address >> 32) | (v4 >> 32);
4416 dw[6] =
4425 dw[7] =
4438 dw[8] =
4444 dw[9] =
4477 uint32_t * restrict dw = (uint32_t * restrict) dst;
4479 dw[0] =
4486 dw[1] =
4491 __gen_address(data, &dw[2], values->SurfaceBaseAddress, 0, 0, 63);
4492 dw[2] = v2_address;
4493 dw[3] = v2_address >> 32;
4495 dw[4] =
4555 uint32_t * restrict dw = (uint32_t * restrict) dst;
4557 dw[0] =
4564 dw[1] =
4572 dw[2] =
4580 dw[3] = v3;
4581 dw[4] = v3 >> 32;
4586 __gen_address(data, &dw[5], values->ScratchSpaceBasePointer, v5, 10, 63);
4587 dw[5] = v5_address;
4588 dw[6] = (v5_address >> 32) | (v5 >> 32);
4590 dw[7] =
4602 dw[8] = 0;
4634 uint32_t * restrict dw = (uint32_t * restrict) dst;
4636 dw[0] =
4643 dw[1] =
4648 __gen_address(data, &dw[2], values->BufferStartingAddress, 0, 0, 63);
4649 dw[2] = v2_address;
4650 dw[3] = v2_address >> 32;
4652 dw[4] =
4684 uint32_t * restrict dw = (uint32_t * restrict) dst;
4686 dw[0] =
4693 dw[1] =
4699 dw[2] =
4728 uint32_t * restrict dw = (uint32_t * restrict) dst;
4730 dw[0] =
4737 dw[1] =
4769 uint32_t * restrict dw = (uint32_t * restrict) dst;
4771 dw[0] =
4778 dw[1] =
4808 uint32_t * restrict dw = (uint32_t * restrict) dst;
4810 dw[0] =
4817 dw[1] =
4845 uint32_t * restrict dw = (uint32_t * restrict) dst;
4847 dw[0] =
4854 dw[1] =
4857 dw[2] =
4860 dw[3] =
4863 dw[4] =
4866 dw[5] =
4869 dw[6] =
4872 dw[7] =
4875 dw[8] =
4878 dw[9] =
4881 dw[10] =
4884 dw[11] =
4887 dw[12] =
4890 dw[13] =
4893 dw[14] =
4896 dw[15] =
4899 dw[16] =
4902 dw[17] =
4905 dw[18] =
4908 dw[19] =
4911 dw[20] =
4914 dw[21] =
4917 dw[22] =
4920 dw[23] =
4923 dw[24] =
4926 dw[25] =
4929 dw[26] =
4932 dw[27] =
4935 dw[28] =
4938 dw[29] =
4941 dw[30] =
4944 dw[31] =
4947 dw[32] =
5020 uint32_t * restrict dw = (uint32_t * restrict) dst;
5022 dw[0] =
5031 dw[1] = v1;
5032 dw[2] = v1 >> 32;
5034 dw[3] =
5050 __gen_address(data, &dw[4], values->ScratchSpaceBasePointer, v4, 10, 63);
5051 dw[4] = v4_address;
5052 dw[5] = (v4_address >> 32) | (v4 >> 32);
5054 dw[6] =
5064 dw[7] =
5071 dw[8] = v8;
5072 dw[9] = v8 >> 32;
5076 dw[10] = v10;
5077 dw[11] = v10 >> 32;
5111 uint32_t * restrict dw = (uint32_t * restrict) dst;
5113 dw[0] =
5120 dw[1] =
5177 uint32_t * restrict dw = (uint32_t * restrict) dst;
5179 dw[0] =
5186 dw[1] =
5228 uint32_t * restrict dw = (uint32_t * restrict) dst;
5230 dw[0] =
5237 dw[1] =
5266 uint32_t * restrict dw = (uint32_t * restrict) dst;
5268 dw[0] =
5275 dw[1] =
5304 uint32_t * restrict dw = (uint32_t * restrict) dst;
5306 dw[0] =
5313 dw[1] =
5342 uint32_t * restrict dw = (uint32_t * restrict) dst;
5344 dw[0] =
5351 dw[1] =
5380 uint32_t * restrict dw = (uint32_t * restrict) dst;
5382 dw[0] =
5389 dw[1] =
5462 uint32_t * restrict dw = (uint32_t * restrict) dst;
5464 dw[0] =
5471 dw[1] =
5491 dw[2] =
5494 dw[3] =
5497 dw[4] =
5531 uint32_t * restrict dw = (uint32_t * restrict) dst;
5533 dw[0] =
5540 dw[1] =
5544 dw[2] = __gen_address(data, &dw[2], values->GlobalConstantBufferAddress, 0, 6, 31);
5546 dw[3] = __gen_address(data, &dw[3], values->GlobalConstantBufferAddressHigh, 0, 0, 31);
5570 uint32_t * restrict dw = (uint32_t * restrict) dst;
5572 dw[0] =
5602 uint32_t * restrict dw = (uint32_t * restrict) dst;
5604 dw[0] =
5635 uint32_t * restrict dw = (uint32_t * restrict) dst;
5637 dw[0] =
5644 dw[1] =
5671 uint32_t * restrict dw = (uint32_t * restrict) dst;
5673 dw[0] =
5680 dw[1] =
5707 uint32_t * restrict dw = (uint32_t * restrict) dst;
5709 dw[0] =
5716 dw[1] =
5743 uint32_t * restrict dw = (uint32_t * restrict) dst;
5745 dw[0] =
5752 dw[1] =
5779 uint32_t * restrict dw = (uint32_t * restrict) dst;
5781 dw[0] =
5788 dw[1] =
5815 uint32_t * restrict dw = (uint32_t * restrict) dst;
5817 dw[0] =
5824 dw[1] =
5912 uint32_t * restrict dw = (uint32_t * restrict) dst;
5914 dw[0] =
5921 dw[1] =
5931 dw[2] =
5941 dw[3] =
5951 dw[4] =
5961 dw[5] =
5971 dw[6] =
5981 dw[7] =
5991 dw[8] =
6043 uint32_t * restrict dw = (uint32_t * restrict) dst;
6045 dw[0] =
6052 dw[1] =
6066 dw[2] =
6069 dw[3] =
6072 dw[4] =
6090 dw[5] =
6133 uint32_t * restrict dw = (uint32_t * restrict) dst;
6135 dw[0] =
6148 dw[1] =
6158 dw[2] =
6168 dw[3] =
6178 dw[4] =
6188 dw[5] =
6198 dw[6] =
6208 dw[7] =
6218 dw[8] =
6222 dw[9] =
6232 dw[10] =
6266 uint32_t * restrict dw = (uint32_t * restrict) dst;
6268 dw[0] =
6275 dw[1] =
6324 uint32_t * restrict dw = (uint32_t * restrict) dst;
6326 dw[0] =
6333 dw[1] =
6339 dw[2] =
6342 dw[3] =
6385 uint32_t * restrict dw = (uint32_t * restrict) dst;
6387 dw[0] =
6394 dw[1] =
6402 __gen_address(data, &dw[2], values->SurfaceBaseAddress, 0, 2, 47);
6403 dw[2] = v2_address;
6404 dw[3] = v2_address >> 32;
6406 dw[4] =
6410 __gen_address(data, &dw[5], values->StreamOutputBufferOffsetAddress, 0, 2, 47);
6411 dw[5] = v5_address;
6412 dw[6] = v5_address >> 32;
6414 dw[7] =
6447 uint32_t * restrict dw = (uint32_t * restrict) dst;
6449 dw[0] =
6456 dw[1] =
6462 dw[2] =
6496 uint32_t * restrict dw = (uint32_t * restrict) dst;
6498 dw[0] =
6505 dw[1] =
6511 __gen_address(data, &dw[2], values->SurfaceBaseAddress, 0, 0, 63);
6512 dw[2] = v2_address;
6513 dw[3] = v2_address >> 32;
6515 dw[4] =
6564 uint32_t * restrict dw = (uint32_t * restrict) dst;
6566 dw[0] =
6573 dw[1] =
6581 dw[2] =
6591 dw[3] =
6595 dw[4] =
6640 uint32_t * restrict dw = (uint32_t * restrict) dst;
6642 dw[0] =
6649 dw[1] =
6656 dw[2] =
6659 dw[3] =
6687 uint32_t * restrict dw = (uint32_t * restrict) dst;
6689 dw[0] =
6696 dw[1] =
6726 uint32_t * restrict dw = (uint32_t * restrict) dst;
6728 dw[0] =
6735 dw[1] =
6766 uint32_t * restrict dw = (uint32_t * restrict) dst;
6768 dw[0] =
6775 dw[1] =
6806 uint32_t * restrict dw = (uint32_t * restrict) dst;
6808 dw[0] =
6815 dw[1] =
6846 uint32_t * restrict dw = (uint32_t * restrict) dst;
6848 dw[0] =
6855 dw[1] =
6883 uint32_t * restrict dw = (uint32_t * restrict) dst;
6885 dw[0] =
6915 uint32_t * restrict dw = (uint32_t * restrict) dst;
6917 dw[0] =
6951 uint32_t * restrict dw = (uint32_t * restrict) dst;
6953 dw[0] =
6963 dw[1] =
7021 uint32_t * restrict dw = (uint32_t * restrict) dst;
7023 dw[0] =
7030 dw[1] =
7040 dw[2] =
7050 dw[3] =
7060 dw[4] =
7096 uint32_t * restrict dw = (uint32_t * restrict) dst;
7098 dw[0] =
7105 dw[1] =
7109 dw[2] =
7149 uint32_t * restrict dw = (uint32_t * restrict) dst;
7151 dw[0] =
7158 dw[1] =
7188 uint32_t * restrict dw = (uint32_t * restrict) dst;
7190 dw[0] =
7221 uint32_t * restrict dw = (uint32_t * restrict) dst;
7223 dw[0] =
7230 dw[1] =
7257 uint32_t * restrict dw = (uint32_t * restrict) dst;
7259 dw[0] =
7266 dw[1] =
7293 uint32_t * restrict dw = (uint32_t * restrict) dst;
7295 dw[0] =
7302 dw[1] =
7360 uint32_t * restrict dw = (uint32_t * restrict) dst;
7362 dw[0] =
7371 dw[1] = v1;
7372 dw[2] = v1 >> 32;
7374 dw[3] =
7388 __gen_address(data, &dw[4], values->ScratchSpaceBasePointer, v4, 10, 63);
7389 dw[4] = v4_address;
7390 dw[5] = (v4_address >> 32) | (v4 >> 32);
7392 dw[6] =
7397 dw[7] =
7404 dw[8] =
7474 uint32_t * restrict dw = (uint32_t * restrict) dst;
7476 dw[0] =
7483 dw[1] =
7524 uint32_t * restrict dw = (uint32_t * restrict) dst;
7526 dw[0] =
7533 dw[1] =
7579 uint32_t * restrict dw = (uint32_t * restrict) dst;
7581 dw[0] =
7588 dw[1] =
7604 dw[2] =
7610 dw[3] =
7651 uint32_t * restrict dw = (uint32_t * restrict) dst;
7653 dw[0] =
7660 dw[1] =
7671 dw[2] =
7675 dw[3] =
7679 dw[4] =
7706 uint32_t * restrict dw = (uint32_t * restrict) dst;
7708 dw[0] =
7716 __gen_address(data, &dw[1], values->GPGPUCSRBaseAddress, 0, 12, 63);
7717 dw[1] = v1_address;
7718 dw[2] = v1_address >> 32;
7763 uint32_t * restrict dw = (uint32_t * restrict) dst;
7765 dw[0] =
7774 dw[1] =
7777 dw[2] =
7780 dw[3] =
7783 dw[4] =
7789 dw[5] =
7792 dw[6] = 0;
7794 dw[7] =
7797 dw[8] =
7800 dw[9] = 0;
7802 dw[10] =
7805 dw[11] =
7808 dw[12] =
7811 dw[13] =
7814 dw[14] =
7842 uint32_t * restrict dw = (uint32_t * restrict) dst;
7844 dw[0] =
7851 dw[1] = 0;
7853 dw[2] =
7856 dw[3] =
7884 uint32_t * restrict dw = (uint32_t * restrict) dst;
7886 dw[0] =
7893 dw[1] = 0;
7895 dw[2] =
7898 dw[3] =
7949 uint32_t * restrict dw = (uint32_t * restrict) dst;
7951 dw[0] =
7958 dw[1] =
7961 dw[2] =
7971 dw[3] = __gen_address(data, &dw[3], values->IndirectDataStartAddress, 0, 0, 31);
7973 dw[4] =
7977 dw[5] =
8027 uint32_t * restrict dw = (uint32_t * restrict) dst;
8029 dw[0] =
8036 dw[1] =
8039 dw[2] =
8048 dw[3] = __gen_address(data, &dw[3], values->IndirectDataStartAddress, 0, 0, 31);
8050 dw[4] =
8054 dw[5] =
8058 dw[6] =
8091 uint32_t * restrict dw = (uint32_t * restrict) dst;
8093 dw[0] =
8100 dw[1] =
8103 dw[2] =
8108 dw[3] = 0;
8110 dw[4] =
8113 dw[5] =
8116 dw[6] =
8119 dw[7] =
8122 dw[8] =
8125 dw[9] =
8128 dw[10] =
8131 dw[11] =
8134 dw[12] =
8137 dw[13] =
8140 dw[14] =
8143 dw[15] =
8209 uint32_t * restrict dw = (uint32_t * restrict) dst;
8211 dw[0] =
8218 dw[1] =
8221 dw[2] =
8227 dw[3] =
8230 dw[4] = 0;
8232 dw[5] =
8236 dw[6] =
8242 dw[7] =
8246 dw[8] =
8250 dw[9] =
8254 dw[10] = 0;
8256 dw[11] =
8260 dw[12] =
8264 dw[13] =
8268 dw[14] =
8272 dw[15] =
8276 dw[16] =
8306 uint32_t * restrict dw = (uint32_t * restrict) dst;
8308 dw[0] =
8315 dw[1] =
8378 uint32_t * restrict dw = (uint32_t * restrict) dst;
8380 dw[0] =
8391 __gen_address(data, &dw[1], values->ScratchSpaceBasePointer, v1, 10, 47);
8392 dw[1] = v1_address;
8393 dw[2] = (v1_address >> 32) | (v1 >> 32);
8395 dw[3] =
8400 dw[4] =
8403 dw[5] =
8407 dw[6] =
8412 dw[7] =
8422 dw[8] =
8449 uint32_t * restrict dw = (uint32_t * restrict) dst;
8451 dw[0] =
8474 uint32_t * restrict dw = (uint32_t * restrict) dst;
8476 dw[0] =
8522 uint32_t * restrict dw = (uint32_t * restrict) dst;
8524 dw[0] =
8537 __gen_address(data, &dw[1], values->MemoryAddress, 0, 2, 47);
8538 dw[1] = v1_address;
8539 dw[2] = v1_address >> 32;
8558 uint32_t * restrict dw = (uint32_t * restrict) dst;
8560 dw[0] =
8593 uint32_t * restrict dw = (uint32_t * restrict) dst;
8595 dw[0] =
8606 __gen_address(data, &dw[1], values->BatchBufferStartAddress, 0, 2, 63);
8607 dw[1] = v1_address;
8608 dw[2] = v1_address >> 32;
8632 uint32_t * restrict dw = (uint32_t * restrict) dst;
8634 dw[0] =
8643 __gen_address(data, &dw[1], values->PageBaseAddress, v1, 12, 47);
8644 dw[1] = v1_address;
8645 dw[2] = (v1_address >> 32) | (v1 >> 32);
8674 uint32_t * restrict dw = (uint32_t * restrict) dst;
8676 dw[0] =
8684 dw[1] =
8688 __gen_address(data, &dw[2], values->CompareAddress, 0, 3, 63);
8689 dw[2] = v2_address;
8690 dw[3] = v2_address >> 32;
8715 uint32_t * restrict dw = (uint32_t * restrict) dst;
8717 dw[0] =
8725 __gen_address(data, &dw[1], values->DestinationMemoryAddress, 0, 2, 63);
8726 dw[1] = v1_address;
8727 dw[2] = v1_address >> 32;
8730 __gen_address(data, &dw[3], values->SourceMemoryAddress, 0, 2, 63);
8731 dw[3] = v3_address;
8732 dw[4] = v3_address >> 32;
8776 uint32_t * restrict dw = (uint32_t * restrict) dst;
8778 dw[0] =
8785 dw[1] =
8792 dw[2] = __gen_address(data, &dw[2], values->DisplayBufferBaseAddress, v2, 12, 31);
8816 uint32_t * restrict dw = (uint32_t * restrict) dst;
8818 dw[0] =
8823 dw[1] =
8851 uint32_t * restrict dw = (uint32_t * restrict) dst;
8853 dw[0] =
8859 dw[1] =
8862 dw[2] =
8888 uint32_t * restrict dw = (uint32_t * restrict) dst;
8890 dw[0] =
8897 dw[1] =
8901 __gen_address(data, &dw[2], values->MemoryAddress, 0, 2, 63);
8902 dw[2] = v2_address;
8903 dw[3] = v2_address >> 32;
8926 uint32_t * restrict dw = (uint32_t * restrict) dst;
8928 dw[0] =
8933 dw[1] =
8936 dw[2] =
8964 uint32_t * restrict dw = (uint32_t * restrict) dst;
8966 dw[0] =
8972 dw[1] =
9002 uint32_t * restrict dw = (uint32_t * restrict) dst;
9004 dw[0] =
9011 dw[1] =
9036 uint32_t * restrict dw = (uint32_t * restrict) dst;
9038 dw[0] =
9043 dw[1] =
9047 __gen_address(data, &dw[2], values->MemoryAddress, 0, 6, 63);
9048 dw[2] = v2_address;
9049 dw[3] = v2_address >> 32;
9070 uint32_t * restrict dw = (uint32_t * restrict) dst;
9072 dw[0] =
9096 uint32_t * restrict dw = (uint32_t * restrict) dst;
9098 dw[0] =
9135 uint32_t * restrict dw = (uint32_t * restrict) dst;
9137 dw[0] =
9161 uint32_t * restrict dw = (uint32_t * restrict) dst;
9163 dw[0] =
9190 uint32_t * restrict dw = (uint32_t * restrict) dst;
9192 dw[0] =
9201 __gen_address(data, &dw[1], values->MemoryAddress, v1, 6, 63);
9202 dw[1] = v1_address;
9203 dw[2] = (v1_address >> 32) | (v1 >> 32);
9205 dw[3] =
9228 uint32_t * restrict dw = (uint32_t * restrict) dst;
9230 dw[0] =
9255 uint32_t * restrict dw = (uint32_t * restrict) dst;
9257 dw[0] =
9284 uint32_t * restrict dw = (uint32_t * restrict) dst;
9286 dw[0] =
9294 __gen_address(data, &dw[1], values->DestinationAddress, v1, 2, 63);
9295 dw[1] = v1_address;
9296 dw[2] = (v1_address >> 32) | (v1 >> 32);
9298 dw[3] =
9328 uint32_t * restrict dw = (uint32_t * restrict) dst;
9330 dw[0] =
9337 dw[1] =
9375 uint32_t * restrict dw = (uint32_t * restrict) dst;
9377 dw[0] =
9386 dw[1] =
9390 __gen_address(data, &dw[2], values->SemaphoreAddress, 0, 2, 63);
9391 dw[2] = v2_address;
9392 dw[3] = v2_address >> 32;
9420 uint32_t * restrict dw = (uint32_t * restrict) dst;
9422 dw[0] =
9434 dw[1] = __gen_address(data, &dw[1], values->LogicalContextAddress, v1, 12, 31);
9463 uint32_t * restrict dw = (uint32_t * restrict) dst;
9465 dw[0] =
9494 uint32_t * restrict dw = (uint32_t * restrict) dst;
9496 dw[0] =
9506 __gen_address(data, &dw[1], values->Address, v1, 2, 47);
9507 dw[1] = v1_address;
9508 dw[2] = (v1_address >> 32) | (v1 >> 32);
9512 dw[3] = v3;
9513 dw[4] = v3 >> 32;
9538 uint32_t * restrict dw = (uint32_t * restrict) dst;
9540 dw[0] =
9546 dw[1] =
9549 dw[2] =
9575 uint32_t * restrict dw = (uint32_t * restrict) dst;
9577 dw[0] =
9584 dw[1] =
9588 __gen_address(data, &dw[2], values->MemoryAddress, 0, 2, 63);
9589 dw[2] = v2_address;
9590 dw[3] = v2_address >> 32;
9613 uint32_t * restrict dw = (uint32_t * restrict) dst;
9615 dw[0] =
9620 dw[1] =
9624 __gen_address(data, &dw[2], values->MemoryAddress, 0, 6, 63);
9625 dw[2] = v2_address;
9626 dw[3] = v2_address >> 32;
9646 uint32_t * restrict dw = (uint32_t * restrict) dst;
9648 dw[0] =
9671 uint32_t * restrict dw = (uint32_t * restrict) dst;
9673 dw[0] =
9697 uint32_t * restrict dw = (uint32_t * restrict) dst;
9699 dw[0] =
9722 uint32_t * restrict dw = (uint32_t * restrict) dst;
9724 dw[0] =
9763 uint32_t * restrict dw = (uint32_t * restrict) dst;
9765 dw[0] =
9815 uint32_t * restrict dw = (uint32_t * restrict) dst;
9817 dw[0] =
9882 uint32_t * restrict dw = (uint32_t * restrict) dst;
9884 dw[0] =
9891 dw[1] =
9916 __gen_address(data, &dw[2], values->Address, 0, 2, 47);
9917 dw[2] = v2_address;
9918 dw[3] = v2_address >> 32;
9922 dw[4] = v4;
9923 dw[5] = v4 >> 32;
9976 uint32_t * restrict dw = (uint32_t * restrict) dst;
9978 dw[0] =
9989 __gen_address(data, &dw[1], values->GeneralStateBaseAddress, v1, 12, 63);
9990 dw[1] = v1_address;
9991 dw[2] = (v1_address >> 32) | (v1 >> 32);
9993 dw[3] =
10000 __gen_address(data, &dw[4], values->SurfaceStateBaseAddress, v4, 12, 63);
10001 dw[4] = v4_address;
10002 dw[5] = (v4_address >> 32) | (v4 >> 32);
10008 __gen_address(data, &dw[6], values->DynamicStateBaseAddress, v6, 12, 63);
10009 dw[6] = v6_address;
10010 dw[7] = (v6_address >> 32) | (v6 >> 32);
10016 __gen_address(data, &dw[8], values->IndirectObjectBaseAddress, v8, 12, 63);
10017 dw[8] = v8_address;
10018 dw[9] = (v8_address >> 32) | (v8 >> 32);
10024 __gen_address(data, &dw[10], values->InstructionBaseAddress, v10, 12, 63);
10025 dw[10] = v10_address;
10026 dw[11] = (v10_address >> 32) | (v10 >> 32);
10028 dw[12] =
10032 dw[13] =
10036 dw[14] =
10040 dw[15] =
10048 __gen_address(data, &dw[16], values->BindlessSurfaceStateBaseAddress, v16, 12, 63);
10049 dw[16] = v16_address;
10050 dw[17] = (v16_address >> 32) | (v16 >> 32);
10052 dw[18] =
10080 uint32_t * restrict dw = (uint32_t * restrict) dst;
10082 dw[0] =
10091 dw[1] = __gen_address(data, &dw[1], values->PrefetchPointer, v1, 6, 31);
10117 uint32_t * restrict dw = (uint32_t * restrict) dst;
10119 dw[0] =
10128 dw[1] = v1;
10129 dw[2] = v1 >> 32;
10143 uint32_t * restrict dw = (uint32_t * restrict) dst;
10145 dw[0] =
10160 uint32_t * restrict dw = (uint32_t * restrict) dst;
10162 dw[0] =
10180 uint32_t * restrict dw = (uint32_t * restrict) dst;
10182 dw[0] =
10209 uint32_t * restrict dw = (uint32_t * restrict) dst;
10211 dw[0] =
10253 uint32_t * restrict dw = (uint32_t * restrict) dst;
10255 dw[0] =
10314 uint32_t * restrict dw = (uint32_t * restrict) dst;
10316 dw[0] =
10356 uint32_t * restrict dw = (uint32_t * restrict) dst;
10360 dw[0] = v0;
10361 dw[1] = v0 >> 32;
10375 uint32_t * restrict dw = (uint32_t * restrict) dst;
10379 dw[0] = v0;
10380 dw[1] = v0 >> 32;
10397 uint32_t * restrict dw = (uint32_t * restrict) dst;
10399 dw[0] =
10420 uint32_t * restrict dw = (uint32_t * restrict) dst;
10422 dw[0] =
10442 uint32_t * restrict dw = (uint32_t * restrict) dst;
10446 dw[0] = v0;
10447 dw[1] = v0 >> 32;
10461 uint32_t * restrict dw = (uint32_t * restrict) dst;
10465 dw[0] = v0;
10466 dw[1] = v0 >> 32;
10496 uint32_t * restrict dw = (uint32_t * restrict) dst;
10498 dw[0] =
10531 uint32_t * restrict dw = (uint32_t * restrict) dst;
10533 dw[0] =
10562 uint32_t * restrict dw = (uint32_t * restrict) dst;
10566 dw[0] = v0;
10567 dw[1] = v0 >> 32;
10581 uint32_t * restrict dw = (uint32_t * restrict) dst;
10585 dw[0] = v0;
10586 dw[1] = v0 >> 32;
10611 uint32_t * restrict dw = (uint32_t * restrict) dst;
10613 dw[0] =
10631 uint32_t * restrict dw = (uint32_t * restrict) dst;
10635 dw[0] = v0;
10636 dw[1] = v0 >> 32;
10650 uint32_t * restrict dw = (uint32_t * restrict) dst;
10654 dw[0] = v0;
10655 dw[1] = v0 >> 32;
10669 uint32_t * restrict dw = (uint32_t * restrict) dst;
10673 dw[0] = v0;
10674 dw[1] = v0 >> 32;
10709 uint32_t * restrict dw = (uint32_t * restrict) dst;
10711 dw[0] =
10751 uint32_t * restrict dw = (uint32_t * restrict) dst;
10753 dw[0] =
10777 uint32_t * restrict dw = (uint32_t * restrict) dst;
10786 dw[0] = v0;
10787 dw[1] = v0 >> 32;
10806 uint32_t * restrict dw = (uint32_t * restrict) dst;
10815 dw[0] = v0;
10816 dw[1] = v0 >> 32;
10830 uint32_t * restrict dw = (uint32_t * restrict) dst;
10834 dw[0] = v0;
10835 dw[1] = v0 >> 32;
10857 uint32_t * restrict dw = (uint32_t * restrict) dst;
10859 dw[0] =
10892 uint32_t * restrict dw = (uint32_t * restrict) dst;
10894 dw[0] =
10924 uint32_t * restrict dw = (uint32_t * restrict) dst;
10926 dw[0] =
10961 uint32_t * restrict dw = (uint32_t * restrict) dst;
10963 dw[0] =
11019 uint32_t * restrict dw = (uint32_t * restrict) dst;
11021 dw[0] =
11061 uint32_t * restrict dw = (uint32_t * restrict) dst;
11063 dw[0] =
11079 uint32_t * restrict dw = (uint32_t * restrict) dst;
11083 dw[0] = v0;
11084 dw[1] = v0 >> 32;
11098 uint32_t * restrict dw = (uint32_t * restrict) dst;
11102 dw[0] = v0;
11103 dw[1] = v0 >> 32;
11117 uint32_t * restrict dw = (uint32_t * restrict) dst;
11121 dw[0] = v0;
11122 dw[1] = v0 >> 32;
11136 uint32_t * restrict dw = (uint32_t * restrict) dst;
11140 dw[0] = v0;
11141 dw[1] = v0 >> 32;
11155 uint32_t * restrict dw = (uint32_t * restrict) dst;
11159 dw[0] = v0;
11160 dw[1] = v0 >> 32;
11174 uint32_t * restrict dw = (uint32_t * restrict) dst;
11178 dw[0] = v0;
11179 dw[1] = v0 >> 32;
11193 uint32_t * restrict dw = (uint32_t * restrict) dst;
11197 dw[0] = v0;
11198 dw[1] = v0 >> 32;
11212 uint32_t * restrict dw = (uint32_t * restrict) dst;
11216 dw[0] = v0;
11217 dw[1] = v0 >> 32;
11231 uint32_t * restrict dw = (uint32_t * restrict) dst;
11233 dw[0] =
11248 uint32_t * restrict dw = (uint32_t * restrict) dst;
11250 dw[0] =
11265 uint32_t * restrict dw = (uint32_t * restrict) dst;
11267 dw[0] =
11282 uint32_t * restrict dw = (uint32_t * restrict) dst;
11284 dw[0] =
11308 uint32_t * restrict dw = (uint32_t * restrict) dst;
11310 dw[0] =
11330 uint32_t * restrict dw = (uint32_t * restrict) dst;
11332 dw[0] =
11378 uint32_t * restrict dw = (uint32_t * restrict) dst;
11380 dw[0] =
11435 uint32_t * restrict dw = (uint32_t * restrict) dst;
11437 dw[0] =
11457 uint32_t * restrict dw = (uint32_t * restrict) dst;
11459 dw[0] =
11476 uint32_t * restrict dw = (uint32_t * restrict) dst;
11478 dw[0] =
11504 uint32_t * restrict dw = (uint32_t * restrict) dst;
11506 dw[0] =
11526 uint32_t * restrict dw = (uint32_t * restrict) dst;
11530 dw[0] = v0;
11531 dw[1] = v0 >> 32;