Created
October 29, 2016 19:26
-
-
Save tpruvot/4461672b4ddb65492c797887a37dc35c to your computer and use it in GitHub Desktop.
This file has been truncated, but you can view the full file.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
// | |
// Generated by NVIDIA NVVM Compiler | |
// | |
// Compiler Build ID: UNKNOWN | |
// Driver | |
// Based on LLVM 3.4svn | |
// | |
.version 5.0 | |
.target sm_61, texmode_independent | |
.address_size 64 | |
.const .align 1 .b8 blake2b_sigma[192] = {0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 14, 10, 4, 8, 9, 15, 13, 6, 1, 12, 0, 2, 11, 7, 5, 3, 11, 8, 12, 0, 5, 2, 15, 13, 10, 14, 3, 6, 7, 1, 9, 4, 7, 9, 3, 1, 13, 12, 11, 14, 2, 6, 5, 10, 4, 0, 15, 8, 9, 0, 5, 7, 2, 4, 10, 15, 14, 1, 11, 12, 6, 8, 3, 13, 2, 12, 6, 10, 0, 11, 8, 3, 4, 13, 7, 5, 15, 14, 1, 9, 12, 5, 1, 15, 14, 13, 4, 10, 0, 7, 6, 3, 9, 2, 8, 11, 13, 11, 7, 14, 12, 1, 3, 9, 5, 0, 15, 4, 8, 6, 2, 10, 6, 15, 14, 9, 11, 3, 0, 8, 12, 2, 13, 7, 1, 4, 10, 5, 10, 2, 8, 4, 7, 6, 1, 5, 15, 11, 9, 14, 3, 12, 13, 0, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 14, 10, 4, 8, 9, 15, 13, 6, 1, 12, 0, 2, 11, 7, 5, 3}; | |
.func local_listindices8( | |
.param .b64 local_listindices8_param_0, | |
.param .b64 local_listindices8_param_1, | |
.param .b32 local_listindices8_param_2, | |
.param .b64 local_listindices8_param_3 | |
) | |
{ | |
.reg .pred %p<262>; | |
.reg .b32 %r<6608>; | |
.reg .b64 %rd<1941>; | |
ld.param.u64 %rd135, [local_listindices8_param_0]; | |
ld.param.u64 %rd136, [local_listindices8_param_1]; | |
ld.param.u32 %r1504, [local_listindices8_param_2]; | |
ld.param.u64 %rd137, [local_listindices8_param_3]; | |
cvta.to.local.u64 %rd1, %rd137; | |
and.b32 %r1505, %r1504, 65535; | |
bfe.u32 %r1506, %r1504, 16, 6; | |
mul.wide.u32 %rd138, %r1505, 1792; | |
add.s64 %rd139, %rd136, %rd138; | |
mul.wide.u32 %rd140, %r1506, 28; | |
add.s64 %rd141, %rd139, %rd140; | |
ld.global.u32 %r1, [%rd141+12]; | |
and.b32 %r1507, %r1, 65535; | |
add.s64 %rd3, %rd135, 12; | |
bfe.u32 %r1508, %r1, 16, 6; | |
mul.wide.u32 %rd142, %r1507, 1792; | |
add.s64 %rd143, %rd3, %rd142; | |
mul.wide.u32 %rd144, %r1508, 28; | |
add.s64 %rd145, %rd143, %rd144; | |
ld.global.u32 %r2, [%rd145]; | |
and.b32 %r1509, %r2, 65535; | |
add.s64 %rd146, %rd136, 4; | |
mul.wide.u32 %rd147, %r1509, 1792; | |
add.s64 %rd148, %rd146, %rd147; | |
bfe.u32 %r1510, %r2, 16, 6; | |
mul.wide.u32 %rd149, %r1510, 28; | |
add.s64 %rd150, %rd148, %rd149; | |
ld.global.u32 %r3, [%rd150+4]; | |
and.b32 %r1511, %r3, 65535; | |
mul.wide.u32 %rd151, %r1511, 1792; | |
add.s64 %rd152, %rd3, %rd151; | |
bfe.u32 %r1512, %r3, 16, 6; | |
mul.wide.u32 %rd153, %r1512, 28; | |
add.s64 %rd154, %rd152, %rd153; | |
ld.global.u32 %r4, [%rd154+-4]; | |
and.b32 %r1513, %r4, 65535; | |
bfe.u32 %r1514, %r4, 16, 6; | |
mul.wide.u32 %rd155, %r1513, 1792; | |
add.s64 %rd156, %rd146, %rd155; | |
mul.wide.u32 %rd157, %r1514, 28; | |
add.s64 %rd158, %rd156, %rd157; | |
ld.global.u32 %r5, [%rd158]; | |
and.b32 %r1515, %r5, 65535; | |
mul.wide.u32 %rd159, %r1515, 1792; | |
add.s64 %rd160, %rd3, %rd159; | |
bfe.u32 %r1516, %r5, 16, 6; | |
mul.wide.u32 %rd161, %r1516, 28; | |
add.s64 %rd162, %rd160, %rd161; | |
ld.global.u32 %r6, [%rd162+-8]; | |
and.b32 %r1517, %r6, 65535; | |
bfe.u32 %r1518, %r6, 16, 6; | |
mul.wide.u32 %rd163, %r1517, 1792; | |
add.s64 %rd164, %rd136, %rd163; | |
mul.wide.u32 %rd165, %r1518, 28; | |
add.s64 %rd166, %rd164, %rd165; | |
ld.global.u32 %r1519, [%rd166]; | |
and.b32 %r1520, %r1519, 65535; | |
bfe.u32 %r1521, %r1519, 16, 6; | |
mul.wide.u32 %rd167, %r1520, 1792; | |
add.s64 %rd168, %rd135, %rd167; | |
mul.wide.u32 %rd169, %r1521, 28; | |
add.s64 %rd170, %rd168, %rd169; | |
ld.global.u32 %r1522, [%rd170]; | |
and.b32 %r1523, %r1522, 65535; | |
shl.b32 %r1524, %r1523, 6; | |
bfe.u32 %r1525, %r1522, 16, 6; | |
or.b32 %r7, %r1524, %r1525; | |
st.local.u32 [%rd1], %r7; | |
bfe.u32 %r1526, %r1519, 22, 6; | |
mul.wide.u32 %rd171, %r1526, 28; | |
add.s64 %rd172, %rd168, %rd171; | |
ld.global.u32 %r1527, [%rd172]; | |
and.b32 %r1528, %r1527, 65535; | |
shl.b32 %r1529, %r1528, 6; | |
bfe.u32 %r1530, %r1527, 16, 6; | |
or.b32 %r5080, %r1529, %r1530; | |
st.local.u32 [%rd1+4], %r5080; | |
setp.le.u32 %p1, %r7, %r5080; | |
mov.u32 %r5079, %r7; | |
@%p1 bra BB0_2; | |
st.local.u32 [%rd1], %r5080; | |
st.local.u32 [%rd1+4], %r7; | |
mov.u32 %r4276, %r5080; | |
mov.u32 %r5080, %r7; | |
mov.u32 %r5079, %r4276; | |
BB0_2: | |
mov.u32 %r5075, %r5079; | |
mov.u32 %r5076, %r5080; | |
bfe.u32 %r1531, %r6, 22, 6; | |
mul.wide.u32 %rd175, %r1531, 28; | |
add.s64 %rd176, %rd164, %rd175; | |
ld.global.u32 %r1533, [%rd176]; | |
and.b32 %r1534, %r1533, 65535; | |
bfe.u32 %r1535, %r1533, 16, 6; | |
mul.wide.u32 %rd177, %r1534, 1792; | |
add.s64 %rd178, %rd135, %rd177; | |
mul.wide.u32 %rd179, %r1535, 28; | |
add.s64 %rd180, %rd178, %rd179; | |
ld.global.u32 %r1536, [%rd180]; | |
and.b32 %r1537, %r1536, 65535; | |
shl.b32 %r1538, %r1537, 6; | |
bfe.u32 %r1539, %r1536, 16, 6; | |
or.b32 %r11, %r1538, %r1539; | |
st.local.u32 [%rd1+8], %r11; | |
bfe.u32 %r1540, %r1533, 22, 6; | |
mul.wide.u32 %rd181, %r1540, 28; | |
add.s64 %rd182, %rd178, %rd181; | |
ld.global.u32 %r1541, [%rd182]; | |
and.b32 %r1542, %r1541, 65535; | |
shl.b32 %r1543, %r1542, 6; | |
bfe.u32 %r1544, %r1541, 16, 6; | |
or.b32 %r5082, %r1543, %r1544; | |
st.local.u32 [%rd1+12], %r5082; | |
setp.le.u32 %p2, %r11, %r5082; | |
mov.u32 %r5081, %r11; | |
@%p2 bra BB0_4; | |
st.local.u32 [%rd1+8], %r5082; | |
st.local.u32 [%rd1+12], %r11; | |
mov.u32 %r4282, %r5082; | |
mov.u32 %r5082, %r11; | |
mov.u32 %r5081, %r4282; | |
BB0_4: | |
mov.u32 %r14, %r5081; | |
mov.u32 %r13, %r5082; | |
setp.le.u32 %p3, %r5075, %r14; | |
mov.u32 %r5077, %r14; | |
mov.u32 %r5078, %r13; | |
@%p3 bra BB0_6; | |
st.local.u32 [%rd1], %r14; | |
st.local.u32 [%rd1+8], %r5075; | |
st.local.u32 [%rd1+4], %r13; | |
st.local.u32 [%rd1+12], %r5076; | |
mov.u32 %r4279, %r5076; | |
mov.u32 %r4281, %r5075; | |
mov.u32 %r5076, %r13; | |
mov.u32 %r5075, %r14; | |
mov.u32 %r5077, %r4281; | |
mov.u32 %r5078, %r4279; | |
BB0_6: | |
mov.u32 %r5067, %r5075; | |
mov.u32 %r5068, %r5076; | |
mov.u32 %r5069, %r5077; | |
mov.u32 %r5070, %r5078; | |
bfe.u32 %r1546, %r5, 22, 6; | |
mul.wide.u32 %rd185, %r1546, 28; | |
add.s64 %rd186, %rd160, %rd185; | |
ld.global.u32 %r19, [%rd186+-8]; | |
and.b32 %r1547, %r19, 65535; | |
cvt.u64.u32 %rd5, %r1547; | |
bfe.u32 %r1548, %r19, 16, 6; | |
mul.wide.u32 %rd187, %r1547, 1792; | |
add.s64 %rd188, %rd136, %rd187; | |
mul.wide.u32 %rd189, %r1548, 28; | |
add.s64 %rd190, %rd188, %rd189; | |
ld.global.u32 %r1549, [%rd190]; | |
and.b32 %r1550, %r1549, 65535; | |
bfe.u32 %r1551, %r1549, 16, 6; | |
mul.wide.u32 %rd191, %r1550, 1792; | |
add.s64 %rd192, %rd135, %rd191; | |
mul.wide.u32 %rd193, %r1551, 28; | |
add.s64 %rd194, %rd192, %rd193; | |
ld.global.u32 %r1552, [%rd194]; | |
and.b32 %r1553, %r1552, 65535; | |
shl.b32 %r1554, %r1553, 6; | |
bfe.u32 %r1555, %r1552, 16, 6; | |
or.b32 %r20, %r1554, %r1555; | |
st.local.u32 [%rd1+16], %r20; | |
bfe.u32 %r1556, %r1549, 22, 6; | |
mul.wide.u32 %rd195, %r1556, 28; | |
add.s64 %rd196, %rd192, %rd195; | |
ld.global.u32 %r1557, [%rd196]; | |
and.b32 %r1558, %r1557, 65535; | |
shl.b32 %r1559, %r1558, 6; | |
bfe.u32 %r1560, %r1557, 16, 6; | |
or.b32 %r5088, %r1559, %r1560; | |
st.local.u32 [%rd1+20], %r5088; | |
setp.le.u32 %p4, %r20, %r5088; | |
mov.u32 %r5087, %r20; | |
@%p4 bra BB0_8; | |
st.local.u32 [%rd1+16], %r5088; | |
st.local.u32 [%rd1+20], %r20; | |
mov.u32 %r4296, %r5088; | |
mov.u32 %r5088, %r20; | |
mov.u32 %r5087, %r4296; | |
BB0_8: | |
mov.u32 %r5083, %r5087; | |
mov.u32 %r5084, %r5088; | |
bfe.u32 %r1561, %r19, 22, 6; | |
mul.lo.s64 %rd197, %rd5, 1792; | |
add.s64 %rd198, %rd136, %rd197; | |
mul.wide.u32 %rd199, %r1561, 28; | |
add.s64 %rd200, %rd198, %rd199; | |
ld.global.u32 %r1562, [%rd200]; | |
and.b32 %r1563, %r1562, 65535; | |
bfe.u32 %r1564, %r1562, 16, 6; | |
mul.wide.u32 %rd201, %r1563, 1792; | |
add.s64 %rd202, %rd135, %rd201; | |
mul.wide.u32 %rd203, %r1564, 28; | |
add.s64 %rd204, %rd202, %rd203; | |
ld.global.u32 %r1565, [%rd204]; | |
and.b32 %r1566, %r1565, 65535; | |
shl.b32 %r1567, %r1566, 6; | |
bfe.u32 %r1568, %r1565, 16, 6; | |
or.b32 %r24, %r1567, %r1568; | |
st.local.u32 [%rd1+24], %r24; | |
bfe.u32 %r1569, %r1562, 22, 6; | |
mul.wide.u32 %rd205, %r1569, 28; | |
add.s64 %rd206, %rd202, %rd205; | |
ld.global.u32 %r1570, [%rd206]; | |
and.b32 %r1571, %r1570, 65535; | |
shl.b32 %r1572, %r1571, 6; | |
bfe.u32 %r1573, %r1570, 16, 6; | |
or.b32 %r5090, %r1572, %r1573; | |
st.local.u32 [%rd1+28], %r5090; | |
setp.le.u32 %p5, %r24, %r5090; | |
mov.u32 %r5089, %r24; | |
@%p5 bra BB0_10; | |
st.local.u32 [%rd1+24], %r5090; | |
st.local.u32 [%rd1+28], %r24; | |
mov.u32 %r4302, %r5090; | |
mov.u32 %r5090, %r24; | |
mov.u32 %r5089, %r4302; | |
BB0_10: | |
mov.u32 %r27, %r5089; | |
mov.u32 %r26, %r5090; | |
setp.le.u32 %p6, %r5083, %r27; | |
mov.u32 %r5085, %r27; | |
mov.u32 %r5086, %r26; | |
@%p6 bra BB0_12; | |
st.local.u32 [%rd1+16], %r27; | |
st.local.u32 [%rd1+24], %r5083; | |
st.local.u32 [%rd1+20], %r26; | |
st.local.u32 [%rd1+28], %r5084; | |
mov.u32 %r4299, %r5084; | |
mov.u32 %r4301, %r5083; | |
mov.u32 %r5084, %r26; | |
mov.u32 %r5083, %r27; | |
mov.u32 %r5085, %r4301; | |
mov.u32 %r5086, %r4299; | |
BB0_12: | |
mov.u32 %r31, %r5083; | |
mov.u32 %r30, %r5084; | |
mov.u32 %r29, %r5085; | |
mov.u32 %r28, %r5086; | |
setp.le.u32 %p7, %r5067, %r31; | |
mov.u32 %r5071, %r31; | |
mov.u32 %r5072, %r30; | |
mov.u32 %r5073, %r29; | |
mov.u32 %r5074, %r28; | |
@%p7 bra BB0_14; | |
st.local.u32 [%rd1], %r31; | |
st.local.u32 [%rd1+16], %r5067; | |
st.local.u32 [%rd1+4], %r30; | |
st.local.u32 [%rd1+20], %r5068; | |
st.local.u32 [%rd1+8], %r29; | |
st.local.u32 [%rd1+24], %r5069; | |
st.local.u32 [%rd1+12], %r28; | |
st.local.u32 [%rd1+28], %r5070; | |
mov.u32 %r4289, %r5070; | |
mov.u32 %r4291, %r5069; | |
mov.u32 %r4293, %r5068; | |
mov.u32 %r4295, %r5067; | |
mov.u32 %r5070, %r28; | |
mov.u32 %r5069, %r29; | |
mov.u32 %r5068, %r30; | |
mov.u32 %r5067, %r31; | |
mov.u32 %r5071, %r4295; | |
mov.u32 %r5072, %r4293; | |
mov.u32 %r5073, %r4291; | |
mov.u32 %r5074, %r4289; | |
BB0_14: | |
mov.u32 %r5051, %r5067; | |
mov.u32 %r5052, %r5068; | |
mov.u32 %r5053, %r5069; | |
mov.u32 %r5054, %r5070; | |
mov.u32 %r5055, %r5071; | |
mov.u32 %r5056, %r5072; | |
mov.u32 %r5057, %r5073; | |
mov.u32 %r5058, %r5074; | |
and.b32 %r3561, %r4, 65535; | |
mul.wide.u32 %rd1933, %r3561, 1792; | |
add.s64 %rd208, %rd136, %rd1933; | |
bfe.u32 %r1575, %r4, 22, 6; | |
mul.wide.u32 %rd209, %r1575, 28; | |
add.s64 %rd210, %rd208, %rd209; | |
ld.global.u32 %r40, [%rd210+4]; | |
and.b32 %r1576, %r40, 65535; | |
mul.wide.u32 %rd211, %r1576, 1792; | |
add.s64 %rd212, %rd3, %rd211; | |
cvt.u64.u32 %rd6, %r1576; | |
bfe.u32 %r1577, %r40, 16, 6; | |
mul.wide.u32 %rd213, %r1577, 28; | |
add.s64 %rd214, %rd212, %rd213; | |
ld.global.u32 %r41, [%rd214+-8]; | |
and.b32 %r1578, %r41, 65535; | |
cvt.u64.u32 %rd7, %r1578; | |
bfe.u32 %r1579, %r41, 16, 6; | |
mul.wide.u32 %rd215, %r1578, 1792; | |
add.s64 %rd216, %rd136, %rd215; | |
mul.wide.u32 %rd217, %r1579, 28; | |
add.s64 %rd218, %rd216, %rd217; | |
ld.global.u32 %r1580, [%rd218]; | |
and.b32 %r1581, %r1580, 65535; | |
bfe.u32 %r1582, %r1580, 16, 6; | |
mul.wide.u32 %rd219, %r1581, 1792; | |
add.s64 %rd220, %rd135, %rd219; | |
mul.wide.u32 %rd221, %r1582, 28; | |
add.s64 %rd222, %rd220, %rd221; | |
ld.global.u32 %r1583, [%rd222]; | |
and.b32 %r1584, %r1583, 65535; | |
shl.b32 %r1585, %r1584, 6; | |
bfe.u32 %r1586, %r1583, 16, 6; | |
or.b32 %r42, %r1585, %r1586; | |
st.local.u32 [%rd1+32], %r42; | |
bfe.u32 %r1587, %r1580, 22, 6; | |
mul.wide.u32 %rd223, %r1587, 28; | |
add.s64 %rd224, %rd220, %rd223; | |
ld.global.u32 %r1588, [%rd224]; | |
and.b32 %r1589, %r1588, 65535; | |
shl.b32 %r1590, %r1589, 6; | |
bfe.u32 %r1591, %r1588, 16, 6; | |
or.b32 %r5104, %r1590, %r1591; | |
st.local.u32 [%rd1+36], %r5104; | |
setp.le.u32 %p8, %r42, %r5104; | |
mov.u32 %r5103, %r42; | |
@%p8 bra BB0_16; | |
st.local.u32 [%rd1+32], %r5104; | |
st.local.u32 [%rd1+36], %r42; | |
mov.u32 %r4332, %r5104; | |
mov.u32 %r5104, %r42; | |
mov.u32 %r5103, %r4332; | |
BB0_16: | |
mov.u32 %r5099, %r5103; | |
mov.u32 %r5100, %r5104; | |
bfe.u32 %r1592, %r41, 22, 6; | |
mul.lo.s64 %rd225, %rd7, 1792; | |
add.s64 %rd226, %rd136, %rd225; | |
mul.wide.u32 %rd227, %r1592, 28; | |
add.s64 %rd228, %rd226, %rd227; | |
ld.global.u32 %r1593, [%rd228]; | |
and.b32 %r1594, %r1593, 65535; | |
bfe.u32 %r1595, %r1593, 16, 6; | |
mul.wide.u32 %rd229, %r1594, 1792; | |
add.s64 %rd230, %rd135, %rd229; | |
mul.wide.u32 %rd231, %r1595, 28; | |
add.s64 %rd232, %rd230, %rd231; | |
ld.global.u32 %r1596, [%rd232]; | |
and.b32 %r1597, %r1596, 65535; | |
shl.b32 %r1598, %r1597, 6; | |
bfe.u32 %r1599, %r1596, 16, 6; | |
or.b32 %r46, %r1598, %r1599; | |
st.local.u32 [%rd1+40], %r46; | |
bfe.u32 %r1600, %r1593, 22, 6; | |
mul.wide.u32 %rd233, %r1600, 28; | |
add.s64 %rd234, %rd230, %rd233; | |
ld.global.u32 %r1601, [%rd234]; | |
and.b32 %r1602, %r1601, 65535; | |
shl.b32 %r1603, %r1602, 6; | |
bfe.u32 %r1604, %r1601, 16, 6; | |
or.b32 %r5106, %r1603, %r1604; | |
st.local.u32 [%rd1+44], %r5106; | |
setp.le.u32 %p9, %r46, %r5106; | |
mov.u32 %r5105, %r46; | |
@%p9 bra BB0_18; | |
st.local.u32 [%rd1+40], %r5106; | |
st.local.u32 [%rd1+44], %r46; | |
mov.u32 %r4338, %r5106; | |
mov.u32 %r5106, %r46; | |
mov.u32 %r5105, %r4338; | |
BB0_18: | |
mov.u32 %r49, %r5105; | |
mov.u32 %r48, %r5106; | |
setp.le.u32 %p10, %r5099, %r49; | |
mov.u32 %r5101, %r49; | |
mov.u32 %r5102, %r48; | |
@%p10 bra BB0_20; | |
st.local.u32 [%rd1+32], %r49; | |
st.local.u32 [%rd1+40], %r5099; | |
st.local.u32 [%rd1+36], %r48; | |
st.local.u32 [%rd1+44], %r5100; | |
mov.u32 %r4335, %r5100; | |
mov.u32 %r4337, %r5099; | |
mov.u32 %r5100, %r48; | |
mov.u32 %r5099, %r49; | |
mov.u32 %r5101, %r4337; | |
mov.u32 %r5102, %r4335; | |
BB0_20: | |
mov.u32 %r5091, %r5099; | |
mov.u32 %r5092, %r5100; | |
mov.u32 %r5093, %r5101; | |
mov.u32 %r5094, %r5102; | |
mul.lo.s64 %rd235, %rd6, 1792; | |
add.s64 %rd236, %rd3, %rd235; | |
bfe.u32 %r1605, %r40, 22, 6; | |
mul.wide.u32 %rd237, %r1605, 28; | |
add.s64 %rd238, %rd236, %rd237; | |
ld.global.u32 %r54, [%rd238+-8]; | |
and.b32 %r1606, %r54, 65535; | |
cvt.u64.u32 %rd8, %r1606; | |
bfe.u32 %r1607, %r54, 16, 6; | |
mul.wide.u32 %rd239, %r1606, 1792; | |
add.s64 %rd240, %rd136, %rd239; | |
mul.wide.u32 %rd241, %r1607, 28; | |
add.s64 %rd242, %rd240, %rd241; | |
ld.global.u32 %r1608, [%rd242]; | |
and.b32 %r1609, %r1608, 65535; | |
bfe.u32 %r1610, %r1608, 16, 6; | |
mul.wide.u32 %rd243, %r1609, 1792; | |
add.s64 %rd244, %rd135, %rd243; | |
mul.wide.u32 %rd245, %r1610, 28; | |
add.s64 %rd246, %rd244, %rd245; | |
ld.global.u32 %r1611, [%rd246]; | |
and.b32 %r1612, %r1611, 65535; | |
shl.b32 %r1613, %r1612, 6; | |
bfe.u32 %r1614, %r1611, 16, 6; | |
or.b32 %r55, %r1613, %r1614; | |
st.local.u32 [%rd1+48], %r55; | |
bfe.u32 %r1615, %r1608, 22, 6; | |
mul.wide.u32 %rd247, %r1615, 28; | |
add.s64 %rd248, %rd244, %rd247; | |
ld.global.u32 %r1616, [%rd248]; | |
and.b32 %r1617, %r1616, 65535; | |
shl.b32 %r1618, %r1617, 6; | |
bfe.u32 %r1619, %r1616, 16, 6; | |
or.b32 %r5112, %r1618, %r1619; | |
st.local.u32 [%rd1+52], %r5112; | |
setp.le.u32 %p11, %r55, %r5112; | |
mov.u32 %r5111, %r55; | |
@%p11 bra BB0_22; | |
st.local.u32 [%rd1+48], %r5112; | |
st.local.u32 [%rd1+52], %r55; | |
mov.u32 %r4352, %r5112; | |
mov.u32 %r5112, %r55; | |
mov.u32 %r5111, %r4352; | |
BB0_22: | |
mov.u32 %r5107, %r5111; | |
mov.u32 %r5108, %r5112; | |
bfe.u32 %r1620, %r54, 22, 6; | |
mul.lo.s64 %rd249, %rd8, 1792; | |
add.s64 %rd250, %rd136, %rd249; | |
mul.wide.u32 %rd251, %r1620, 28; | |
add.s64 %rd252, %rd250, %rd251; | |
ld.global.u32 %r1621, [%rd252]; | |
and.b32 %r1622, %r1621, 65535; | |
bfe.u32 %r1623, %r1621, 16, 6; | |
mul.wide.u32 %rd253, %r1622, 1792; | |
add.s64 %rd254, %rd135, %rd253; | |
mul.wide.u32 %rd255, %r1623, 28; | |
add.s64 %rd256, %rd254, %rd255; | |
ld.global.u32 %r1624, [%rd256]; | |
and.b32 %r1625, %r1624, 65535; | |
shl.b32 %r1626, %r1625, 6; | |
bfe.u32 %r1627, %r1624, 16, 6; | |
or.b32 %r59, %r1626, %r1627; | |
st.local.u32 [%rd1+56], %r59; | |
bfe.u32 %r1628, %r1621, 22, 6; | |
mul.wide.u32 %rd257, %r1628, 28; | |
add.s64 %rd258, %rd254, %rd257; | |
ld.global.u32 %r1629, [%rd258]; | |
and.b32 %r1630, %r1629, 65535; | |
shl.b32 %r1631, %r1630, 6; | |
bfe.u32 %r1632, %r1629, 16, 6; | |
or.b32 %r5114, %r1631, %r1632; | |
st.local.u32 [%rd1+60], %r5114; | |
setp.le.u32 %p12, %r59, %r5114; | |
mov.u32 %r5113, %r59; | |
@%p12 bra BB0_24; | |
st.local.u32 [%rd1+56], %r5114; | |
st.local.u32 [%rd1+60], %r59; | |
mov.u32 %r4358, %r5114; | |
mov.u32 %r5114, %r59; | |
mov.u32 %r5113, %r4358; | |
BB0_24: | |
mov.u32 %r62, %r5113; | |
mov.u32 %r61, %r5114; | |
setp.le.u32 %p13, %r5107, %r62; | |
mov.u32 %r5109, %r62; | |
mov.u32 %r5110, %r61; | |
@%p13 bra BB0_26; | |
st.local.u32 [%rd1+48], %r62; | |
st.local.u32 [%rd1+56], %r5107; | |
st.local.u32 [%rd1+52], %r61; | |
st.local.u32 [%rd1+60], %r5108; | |
mov.u32 %r4355, %r5108; | |
mov.u32 %r4357, %r5107; | |
mov.u32 %r5108, %r61; | |
mov.u32 %r5107, %r62; | |
mov.u32 %r5109, %r4357; | |
mov.u32 %r5110, %r4355; | |
BB0_26: | |
mov.u32 %r66, %r5107; | |
mov.u32 %r65, %r5108; | |
mov.u32 %r64, %r5109; | |
mov.u32 %r63, %r5110; | |
setp.le.u32 %p14, %r5091, %r66; | |
mov.u32 %r5095, %r66; | |
mov.u32 %r5096, %r65; | |
mov.u32 %r5097, %r64; | |
mov.u32 %r5098, %r63; | |
@%p14 bra BB0_28; | |
st.local.u32 [%rd1+32], %r66; | |
st.local.u32 [%rd1+48], %r5091; | |
st.local.u32 [%rd1+36], %r65; | |
st.local.u32 [%rd1+52], %r5092; | |
st.local.u32 [%rd1+40], %r64; | |
st.local.u32 [%rd1+56], %r5093; | |
st.local.u32 [%rd1+44], %r63; | |
st.local.u32 [%rd1+60], %r5094; | |
mov.u32 %r4345, %r5094; | |
mov.u32 %r4347, %r5093; | |
mov.u32 %r4349, %r5092; | |
mov.u32 %r4351, %r5091; | |
mov.u32 %r5094, %r63; | |
mov.u32 %r5093, %r64; | |
mov.u32 %r5092, %r65; | |
mov.u32 %r5091, %r66; | |
mov.u32 %r5095, %r4351; | |
mov.u32 %r5096, %r4349; | |
mov.u32 %r5097, %r4347; | |
mov.u32 %r5098, %r4345; | |
BB0_28: | |
mov.u32 %r74, %r5091; | |
mov.u32 %r73, %r5092; | |
mov.u32 %r72, %r5093; | |
mov.u32 %r71, %r5094; | |
mov.u32 %r70, %r5095; | |
mov.u32 %r69, %r5096; | |
mov.u32 %r68, %r5097; | |
mov.u32 %r67, %r5098; | |
setp.le.u32 %p15, %r5051, %r74; | |
mov.u32 %r5059, %r74; | |
mov.u32 %r5060, %r73; | |
mov.u32 %r5061, %r72; | |
mov.u32 %r5062, %r71; | |
mov.u32 %r5063, %r70; | |
mov.u32 %r5064, %r69; | |
mov.u32 %r5065, %r68; | |
mov.u32 %r5066, %r67; | |
@%p15 bra BB0_30; | |
st.local.u32 [%rd1], %r74; | |
st.local.u32 [%rd1+32], %r5051; | |
st.local.u32 [%rd1+4], %r73; | |
st.local.u32 [%rd1+36], %r5052; | |
st.local.u32 [%rd1+8], %r72; | |
st.local.u32 [%rd1+40], %r5053; | |
st.local.u32 [%rd1+12], %r71; | |
st.local.u32 [%rd1+44], %r5054; | |
st.local.u32 [%rd1+16], %r70; | |
st.local.u32 [%rd1+48], %r5055; | |
st.local.u32 [%rd1+20], %r69; | |
st.local.u32 [%rd1+52], %r5056; | |
st.local.u32 [%rd1+24], %r68; | |
st.local.u32 [%rd1+56], %r5057; | |
st.local.u32 [%rd1+28], %r67; | |
st.local.u32 [%rd1+60], %r5058; | |
mov.u32 %r4317, %r5058; | |
mov.u32 %r4319, %r5057; | |
mov.u32 %r4321, %r5056; | |
mov.u32 %r4323, %r5055; | |
mov.u32 %r4325, %r5054; | |
mov.u32 %r4327, %r5053; | |
mov.u32 %r4329, %r5052; | |
mov.u32 %r4331, %r5051; | |
mov.u32 %r5058, %r67; | |
mov.u32 %r5057, %r68; | |
mov.u32 %r5056, %r69; | |
mov.u32 %r5055, %r70; | |
mov.u32 %r5054, %r71; | |
mov.u32 %r5053, %r72; | |
mov.u32 %r5052, %r73; | |
mov.u32 %r5051, %r74; | |
mov.u32 %r5059, %r4331; | |
mov.u32 %r5060, %r4329; | |
mov.u32 %r5061, %r4327; | |
mov.u32 %r5062, %r4325; | |
mov.u32 %r5063, %r4323; | |
mov.u32 %r5064, %r4321; | |
mov.u32 %r5065, %r4319; | |
mov.u32 %r5066, %r4317; | |
BB0_30: | |
mov.u32 %r5019, %r5051; | |
mov.u32 %r5020, %r5052; | |
mov.u32 %r5021, %r5053; | |
mov.u32 %r5022, %r5054; | |
mov.u32 %r5023, %r5055; | |
mov.u32 %r5024, %r5056; | |
mov.u32 %r5025, %r5057; | |
mov.u32 %r5026, %r5058; | |
mov.u32 %r5027, %r5059; | |
mov.u32 %r5028, %r5060; | |
mov.u32 %r5029, %r5061; | |
mov.u32 %r5030, %r5062; | |
mov.u32 %r5031, %r5063; | |
mov.u32 %r5032, %r5064; | |
mov.u32 %r5033, %r5065; | |
mov.u32 %r5034, %r5066; | |
bfe.u32 %r1634, %r3, 22, 6; | |
mul.wide.u32 %rd261, %r1634, 28; | |
add.s64 %rd262, %rd152, %rd261; | |
ld.global.u32 %r91, [%rd262+-4]; | |
and.b32 %r1635, %r91, 65535; | |
mul.wide.u32 %rd263, %r1635, 1792; | |
add.s64 %rd264, %rd136, %rd263; | |
bfe.u32 %r1636, %r91, 16, 6; | |
mul.wide.u32 %rd265, %r1636, 28; | |
add.s64 %rd266, %rd264, %rd265; | |
ld.global.u32 %r92, [%rd266+4]; | |
and.b32 %r1637, %r92, 65535; | |
mul.wide.u32 %rd267, %r1637, 1792; | |
add.s64 %rd268, %rd3, %rd267; | |
cvt.u64.u32 %rd9, %r1635; | |
cvt.u64.u32 %rd10, %r1637; | |
bfe.u32 %r1638, %r92, 16, 6; | |
mul.wide.u32 %rd269, %r1638, 28; | |
add.s64 %rd270, %rd268, %rd269; | |
ld.global.u32 %r93, [%rd270+-8]; | |
and.b32 %r1639, %r93, 65535; | |
cvt.u64.u32 %rd11, %r1639; | |
bfe.u32 %r1640, %r93, 16, 6; | |
mul.wide.u32 %rd271, %r1639, 1792; | |
add.s64 %rd272, %rd136, %rd271; | |
mul.wide.u32 %rd273, %r1640, 28; | |
add.s64 %rd274, %rd272, %rd273; | |
ld.global.u32 %r1641, [%rd274]; | |
and.b32 %r1642, %r1641, 65535; | |
bfe.u32 %r1643, %r1641, 16, 6; | |
mul.wide.u32 %rd275, %r1642, 1792; | |
add.s64 %rd276, %rd135, %rd275; | |
mul.wide.u32 %rd277, %r1643, 28; | |
add.s64 %rd278, %rd276, %rd277; | |
ld.global.u32 %r1644, [%rd278]; | |
and.b32 %r1645, %r1644, 65535; | |
shl.b32 %r1646, %r1645, 6; | |
bfe.u32 %r1647, %r1644, 16, 6; | |
or.b32 %r94, %r1646, %r1647; | |
st.local.u32 [%rd1+64], %r94; | |
bfe.u32 %r1648, %r1641, 22, 6; | |
mul.wide.u32 %rd279, %r1648, 28; | |
add.s64 %rd280, %rd276, %rd279; | |
ld.global.u32 %r1649, [%rd280]; | |
and.b32 %r1650, %r1649, 65535; | |
shl.b32 %r1651, %r1650, 6; | |
bfe.u32 %r1652, %r1649, 16, 6; | |
or.b32 %r5144, %r1651, %r1652; | |
st.local.u32 [%rd1+68], %r5144; | |
setp.le.u32 %p16, %r94, %r5144; | |
mov.u32 %r5143, %r94; | |
@%p16 bra BB0_32; | |
st.local.u32 [%rd1+64], %r5144; | |
st.local.u32 [%rd1+68], %r94; | |
mov.u32 %r4420, %r5144; | |
mov.u32 %r5144, %r94; | |
mov.u32 %r5143, %r4420; | |
BB0_32: | |
mov.u32 %r5139, %r5143; | |
mov.u32 %r5140, %r5144; | |
bfe.u32 %r1653, %r93, 22, 6; | |
mul.lo.s64 %rd281, %rd11, 1792; | |
add.s64 %rd282, %rd136, %rd281; | |
mul.wide.u32 %rd283, %r1653, 28; | |
add.s64 %rd284, %rd282, %rd283; | |
ld.global.u32 %r1654, [%rd284]; | |
and.b32 %r1655, %r1654, 65535; | |
bfe.u32 %r1656, %r1654, 16, 6; | |
mul.wide.u32 %rd285, %r1655, 1792; | |
add.s64 %rd286, %rd135, %rd285; | |
mul.wide.u32 %rd287, %r1656, 28; | |
add.s64 %rd288, %rd286, %rd287; | |
ld.global.u32 %r1657, [%rd288]; | |
and.b32 %r1658, %r1657, 65535; | |
shl.b32 %r1659, %r1658, 6; | |
bfe.u32 %r1660, %r1657, 16, 6; | |
or.b32 %r98, %r1659, %r1660; | |
st.local.u32 [%rd1+72], %r98; | |
bfe.u32 %r1661, %r1654, 22, 6; | |
mul.wide.u32 %rd289, %r1661, 28; | |
add.s64 %rd290, %rd286, %rd289; | |
ld.global.u32 %r1662, [%rd290]; | |
and.b32 %r1663, %r1662, 65535; | |
shl.b32 %r1664, %r1663, 6; | |
bfe.u32 %r1665, %r1662, 16, 6; | |
or.b32 %r5146, %r1664, %r1665; | |
st.local.u32 [%rd1+76], %r5146; | |
setp.le.u32 %p17, %r98, %r5146; | |
mov.u32 %r5145, %r98; | |
@%p17 bra BB0_34; | |
st.local.u32 [%rd1+72], %r5146; | |
st.local.u32 [%rd1+76], %r98; | |
mov.u32 %r4426, %r5146; | |
mov.u32 %r5146, %r98; | |
mov.u32 %r5145, %r4426; | |
BB0_34: | |
mov.u32 %r101, %r5145; | |
mov.u32 %r100, %r5146; | |
setp.le.u32 %p18, %r5139, %r101; | |
mov.u32 %r5141, %r101; | |
mov.u32 %r5142, %r100; | |
@%p18 bra BB0_36; | |
st.local.u32 [%rd1+64], %r101; | |
st.local.u32 [%rd1+72], %r5139; | |
st.local.u32 [%rd1+68], %r100; | |
st.local.u32 [%rd1+76], %r5140; | |
mov.u32 %r4423, %r5140; | |
mov.u32 %r4425, %r5139; | |
mov.u32 %r5140, %r100; | |
mov.u32 %r5139, %r101; | |
mov.u32 %r5141, %r4425; | |
mov.u32 %r5142, %r4423; | |
BB0_36: | |
mov.u32 %r5131, %r5139; | |
mov.u32 %r5132, %r5140; | |
mov.u32 %r5133, %r5141; | |
mov.u32 %r5134, %r5142; | |
mul.lo.s64 %rd291, %rd10, 1792; | |
add.s64 %rd292, %rd3, %rd291; | |
bfe.u32 %r1666, %r92, 22, 6; | |
mul.wide.u32 %rd293, %r1666, 28; | |
add.s64 %rd294, %rd292, %rd293; | |
ld.global.u32 %r106, [%rd294+-8]; | |
and.b32 %r1667, %r106, 65535; | |
cvt.u64.u32 %rd12, %r1667; | |
bfe.u32 %r1668, %r106, 16, 6; | |
mul.wide.u32 %rd295, %r1667, 1792; | |
add.s64 %rd296, %rd136, %rd295; | |
mul.wide.u32 %rd297, %r1668, 28; | |
add.s64 %rd298, %rd296, %rd297; | |
ld.global.u32 %r1669, [%rd298]; | |
and.b32 %r1670, %r1669, 65535; | |
bfe.u32 %r1671, %r1669, 16, 6; | |
mul.wide.u32 %rd299, %r1670, 1792; | |
add.s64 %rd300, %rd135, %rd299; | |
mul.wide.u32 %rd301, %r1671, 28; | |
add.s64 %rd302, %rd300, %rd301; | |
ld.global.u32 %r1672, [%rd302]; | |
and.b32 %r1673, %r1672, 65535; | |
shl.b32 %r1674, %r1673, 6; | |
bfe.u32 %r1675, %r1672, 16, 6; | |
or.b32 %r107, %r1674, %r1675; | |
st.local.u32 [%rd1+80], %r107; | |
bfe.u32 %r1676, %r1669, 22, 6; | |
mul.wide.u32 %rd303, %r1676, 28; | |
add.s64 %rd304, %rd300, %rd303; | |
ld.global.u32 %r1677, [%rd304]; | |
and.b32 %r1678, %r1677, 65535; | |
shl.b32 %r1679, %r1678, 6; | |
bfe.u32 %r1680, %r1677, 16, 6; | |
or.b32 %r5152, %r1679, %r1680; | |
st.local.u32 [%rd1+84], %r5152; | |
setp.le.u32 %p19, %r107, %r5152; | |
mov.u32 %r5151, %r107; | |
@%p19 bra BB0_38; | |
st.local.u32 [%rd1+80], %r5152; | |
st.local.u32 [%rd1+84], %r107; | |
mov.u32 %r4440, %r5152; | |
mov.u32 %r5152, %r107; | |
mov.u32 %r5151, %r4440; | |
BB0_38: | |
mov.u32 %r5147, %r5151; | |
mov.u32 %r5148, %r5152; | |
bfe.u32 %r1681, %r106, 22, 6; | |
mul.lo.s64 %rd305, %rd12, 1792; | |
add.s64 %rd306, %rd136, %rd305; | |
mul.wide.u32 %rd307, %r1681, 28; | |
add.s64 %rd308, %rd306, %rd307; | |
ld.global.u32 %r1682, [%rd308]; | |
and.b32 %r1683, %r1682, 65535; | |
bfe.u32 %r1684, %r1682, 16, 6; | |
mul.wide.u32 %rd309, %r1683, 1792; | |
add.s64 %rd310, %rd135, %rd309; | |
mul.wide.u32 %rd311, %r1684, 28; | |
add.s64 %rd312, %rd310, %rd311; | |
ld.global.u32 %r1685, [%rd312]; | |
and.b32 %r1686, %r1685, 65535; | |
shl.b32 %r1687, %r1686, 6; | |
bfe.u32 %r1688, %r1685, 16, 6; | |
or.b32 %r111, %r1687, %r1688; | |
st.local.u32 [%rd1+88], %r111; | |
bfe.u32 %r1689, %r1682, 22, 6; | |
mul.wide.u32 %rd313, %r1689, 28; | |
add.s64 %rd314, %rd310, %rd313; | |
ld.global.u32 %r1690, [%rd314]; | |
and.b32 %r1691, %r1690, 65535; | |
shl.b32 %r1692, %r1691, 6; | |
bfe.u32 %r1693, %r1690, 16, 6; | |
or.b32 %r5154, %r1692, %r1693; | |
st.local.u32 [%rd1+92], %r5154; | |
setp.le.u32 %p20, %r111, %r5154; | |
mov.u32 %r5153, %r111; | |
@%p20 bra BB0_40; | |
st.local.u32 [%rd1+88], %r5154; | |
st.local.u32 [%rd1+92], %r111; | |
mov.u32 %r4446, %r5154; | |
mov.u32 %r5154, %r111; | |
mov.u32 %r5153, %r4446; | |
BB0_40: | |
mov.u32 %r114, %r5153; | |
mov.u32 %r113, %r5154; | |
setp.le.u32 %p21, %r5147, %r114; | |
mov.u32 %r5149, %r114; | |
mov.u32 %r5150, %r113; | |
@%p21 bra BB0_42; | |
st.local.u32 [%rd1+80], %r114; | |
st.local.u32 [%rd1+88], %r5147; | |
st.local.u32 [%rd1+84], %r113; | |
st.local.u32 [%rd1+92], %r5148; | |
mov.u32 %r4443, %r5148; | |
mov.u32 %r4445, %r5147; | |
mov.u32 %r5148, %r113; | |
mov.u32 %r5147, %r114; | |
mov.u32 %r5149, %r4445; | |
mov.u32 %r5150, %r4443; | |
BB0_42: | |
mov.u32 %r118, %r5147; | |
mov.u32 %r117, %r5148; | |
mov.u32 %r116, %r5149; | |
mov.u32 %r115, %r5150; | |
setp.le.u32 %p22, %r5131, %r118; | |
mov.u32 %r5135, %r118; | |
mov.u32 %r5136, %r117; | |
mov.u32 %r5137, %r116; | |
mov.u32 %r5138, %r115; | |
@%p22 bra BB0_44; | |
st.local.u32 [%rd1+64], %r118; | |
st.local.u32 [%rd1+80], %r5131; | |
st.local.u32 [%rd1+68], %r117; | |
st.local.u32 [%rd1+84], %r5132; | |
st.local.u32 [%rd1+72], %r116; | |
st.local.u32 [%rd1+88], %r5133; | |
st.local.u32 [%rd1+76], %r115; | |
st.local.u32 [%rd1+92], %r5134; | |
mov.u32 %r4433, %r5134; | |
mov.u32 %r4435, %r5133; | |
mov.u32 %r4437, %r5132; | |
mov.u32 %r4439, %r5131; | |
mov.u32 %r5134, %r115; | |
mov.u32 %r5133, %r116; | |
mov.u32 %r5132, %r117; | |
mov.u32 %r5131, %r118; | |
mov.u32 %r5135, %r4439; | |
mov.u32 %r5136, %r4437; | |
mov.u32 %r5137, %r4435; | |
mov.u32 %r5138, %r4433; | |
BB0_44: | |
mov.u32 %r5115, %r5131; | |
mov.u32 %r5116, %r5132; | |
mov.u32 %r5117, %r5133; | |
mov.u32 %r5118, %r5134; | |
mov.u32 %r5119, %r5135; | |
mov.u32 %r5120, %r5136; | |
mov.u32 %r5121, %r5137; | |
mov.u32 %r5122, %r5138; | |
mul.lo.s64 %rd315, %rd9, 1792; | |
add.s64 %rd316, %rd136, %rd315; | |
bfe.u32 %r1694, %r91, 22, 6; | |
mul.wide.u32 %rd317, %r1694, 28; | |
add.s64 %rd318, %rd316, %rd317; | |
ld.global.u32 %r127, [%rd318+4]; | |
and.b32 %r1695, %r127, 65535; | |
mul.wide.u32 %rd319, %r1695, 1792; | |
add.s64 %rd320, %rd3, %rd319; | |
cvt.u64.u32 %rd13, %r1695; | |
bfe.u32 %r1696, %r127, 16, 6; | |
mul.wide.u32 %rd321, %r1696, 28; | |
add.s64 %rd322, %rd320, %rd321; | |
ld.global.u32 %r128, [%rd322+-8]; | |
and.b32 %r1697, %r128, 65535; | |
cvt.u64.u32 %rd14, %r1697; | |
bfe.u32 %r1698, %r128, 16, 6; | |
mul.wide.u32 %rd323, %r1697, 1792; | |
add.s64 %rd324, %rd136, %rd323; | |
mul.wide.u32 %rd325, %r1698, 28; | |
add.s64 %rd326, %rd324, %rd325; | |
ld.global.u32 %r1699, [%rd326]; | |
and.b32 %r1700, %r1699, 65535; | |
bfe.u32 %r1701, %r1699, 16, 6; | |
mul.wide.u32 %rd327, %r1700, 1792; | |
add.s64 %rd328, %rd135, %rd327; | |
mul.wide.u32 %rd329, %r1701, 28; | |
add.s64 %rd330, %rd328, %rd329; | |
ld.global.u32 %r1702, [%rd330]; | |
and.b32 %r1703, %r1702, 65535; | |
shl.b32 %r1704, %r1703, 6; | |
bfe.u32 %r1705, %r1702, 16, 6; | |
or.b32 %r129, %r1704, %r1705; | |
st.local.u32 [%rd1+96], %r129; | |
bfe.u32 %r1706, %r1699, 22, 6; | |
mul.wide.u32 %rd331, %r1706, 28; | |
add.s64 %rd332, %rd328, %rd331; | |
ld.global.u32 %r1707, [%rd332]; | |
and.b32 %r1708, %r1707, 65535; | |
shl.b32 %r1709, %r1708, 6; | |
bfe.u32 %r1710, %r1707, 16, 6; | |
or.b32 %r5168, %r1709, %r1710; | |
st.local.u32 [%rd1+100], %r5168; | |
setp.le.u32 %p23, %r129, %r5168; | |
mov.u32 %r5167, %r129; | |
@%p23 bra BB0_46; | |
st.local.u32 [%rd1+96], %r5168; | |
st.local.u32 [%rd1+100], %r129; | |
mov.u32 %r4476, %r5168; | |
mov.u32 %r5168, %r129; | |
mov.u32 %r5167, %r4476; | |
BB0_46: | |
mov.u32 %r5163, %r5167; | |
mov.u32 %r5164, %r5168; | |
bfe.u32 %r1711, %r128, 22, 6; | |
mul.lo.s64 %rd333, %rd14, 1792; | |
add.s64 %rd334, %rd136, %rd333; | |
mul.wide.u32 %rd335, %r1711, 28; | |
add.s64 %rd336, %rd334, %rd335; | |
ld.global.u32 %r1712, [%rd336]; | |
and.b32 %r1713, %r1712, 65535; | |
bfe.u32 %r1714, %r1712, 16, 6; | |
mul.wide.u32 %rd337, %r1713, 1792; | |
add.s64 %rd338, %rd135, %rd337; | |
mul.wide.u32 %rd339, %r1714, 28; | |
add.s64 %rd340, %rd338, %rd339; | |
ld.global.u32 %r1715, [%rd340]; | |
and.b32 %r1716, %r1715, 65535; | |
shl.b32 %r1717, %r1716, 6; | |
bfe.u32 %r1718, %r1715, 16, 6; | |
or.b32 %r133, %r1717, %r1718; | |
st.local.u32 [%rd1+104], %r133; | |
bfe.u32 %r1719, %r1712, 22, 6; | |
mul.wide.u32 %rd341, %r1719, 28; | |
add.s64 %rd342, %rd338, %rd341; | |
ld.global.u32 %r1720, [%rd342]; | |
and.b32 %r1721, %r1720, 65535; | |
shl.b32 %r1722, %r1721, 6; | |
bfe.u32 %r1723, %r1720, 16, 6; | |
or.b32 %r5170, %r1722, %r1723; | |
st.local.u32 [%rd1+108], %r5170; | |
setp.le.u32 %p24, %r133, %r5170; | |
mov.u32 %r5169, %r133; | |
@%p24 bra BB0_48; | |
st.local.u32 [%rd1+104], %r5170; | |
st.local.u32 [%rd1+108], %r133; | |
mov.u32 %r4482, %r5170; | |
mov.u32 %r5170, %r133; | |
mov.u32 %r5169, %r4482; | |
BB0_48: | |
mov.u32 %r136, %r5169; | |
mov.u32 %r135, %r5170; | |
setp.le.u32 %p25, %r5163, %r136; | |
mov.u32 %r5165, %r136; | |
mov.u32 %r5166, %r135; | |
@%p25 bra BB0_50; | |
st.local.u32 [%rd1+96], %r136; | |
st.local.u32 [%rd1+104], %r5163; | |
st.local.u32 [%rd1+100], %r135; | |
st.local.u32 [%rd1+108], %r5164; | |
mov.u32 %r4479, %r5164; | |
mov.u32 %r4481, %r5163; | |
mov.u32 %r5164, %r135; | |
mov.u32 %r5163, %r136; | |
mov.u32 %r5165, %r4481; | |
mov.u32 %r5166, %r4479; | |
BB0_50: | |
mov.u32 %r5155, %r5163; | |
mov.u32 %r5156, %r5164; | |
mov.u32 %r5157, %r5165; | |
mov.u32 %r5158, %r5166; | |
mul.lo.s64 %rd343, %rd13, 1792; | |
add.s64 %rd344, %rd3, %rd343; | |
bfe.u32 %r1724, %r127, 22, 6; | |
mul.wide.u32 %rd345, %r1724, 28; | |
add.s64 %rd346, %rd344, %rd345; | |
ld.global.u32 %r141, [%rd346+-8]; | |
and.b32 %r1725, %r141, 65535; | |
cvt.u64.u32 %rd15, %r1725; | |
bfe.u32 %r1726, %r141, 16, 6; | |
mul.wide.u32 %rd347, %r1725, 1792; | |
add.s64 %rd348, %rd136, %rd347; | |
mul.wide.u32 %rd349, %r1726, 28; | |
add.s64 %rd350, %rd348, %rd349; | |
ld.global.u32 %r1727, [%rd350]; | |
and.b32 %r1728, %r1727, 65535; | |
bfe.u32 %r1729, %r1727, 16, 6; | |
mul.wide.u32 %rd351, %r1728, 1792; | |
add.s64 %rd352, %rd135, %rd351; | |
mul.wide.u32 %rd353, %r1729, 28; | |
add.s64 %rd354, %rd352, %rd353; | |
ld.global.u32 %r1730, [%rd354]; | |
and.b32 %r1731, %r1730, 65535; | |
shl.b32 %r1732, %r1731, 6; | |
bfe.u32 %r1733, %r1730, 16, 6; | |
or.b32 %r142, %r1732, %r1733; | |
st.local.u32 [%rd1+112], %r142; | |
bfe.u32 %r1734, %r1727, 22, 6; | |
mul.wide.u32 %rd355, %r1734, 28; | |
add.s64 %rd356, %rd352, %rd355; | |
ld.global.u32 %r1735, [%rd356]; | |
and.b32 %r1736, %r1735, 65535; | |
shl.b32 %r1737, %r1736, 6; | |
bfe.u32 %r1738, %r1735, 16, 6; | |
or.b32 %r5176, %r1737, %r1738; | |
st.local.u32 [%rd1+116], %r5176; | |
setp.le.u32 %p26, %r142, %r5176; | |
mov.u32 %r5175, %r142; | |
@%p26 bra BB0_52; | |
st.local.u32 [%rd1+112], %r5176; | |
st.local.u32 [%rd1+116], %r142; | |
mov.u32 %r4496, %r5176; | |
mov.u32 %r5176, %r142; | |
mov.u32 %r5175, %r4496; | |
BB0_52: | |
mov.u32 %r5171, %r5175; | |
mov.u32 %r5172, %r5176; | |
bfe.u32 %r1739, %r141, 22, 6; | |
mul.lo.s64 %rd357, %rd15, 1792; | |
add.s64 %rd358, %rd136, %rd357; | |
mul.wide.u32 %rd359, %r1739, 28; | |
add.s64 %rd360, %rd358, %rd359; | |
ld.global.u32 %r1740, [%rd360]; | |
and.b32 %r1741, %r1740, 65535; | |
bfe.u32 %r1742, %r1740, 16, 6; | |
mul.wide.u32 %rd361, %r1741, 1792; | |
add.s64 %rd362, %rd135, %rd361; | |
mul.wide.u32 %rd363, %r1742, 28; | |
add.s64 %rd364, %rd362, %rd363; | |
ld.global.u32 %r1743, [%rd364]; | |
and.b32 %r1744, %r1743, 65535; | |
shl.b32 %r1745, %r1744, 6; | |
bfe.u32 %r1746, %r1743, 16, 6; | |
or.b32 %r146, %r1745, %r1746; | |
st.local.u32 [%rd1+120], %r146; | |
bfe.u32 %r1747, %r1740, 22, 6; | |
mul.wide.u32 %rd365, %r1747, 28; | |
add.s64 %rd366, %rd362, %rd365; | |
ld.global.u32 %r1748, [%rd366]; | |
and.b32 %r1749, %r1748, 65535; | |
shl.b32 %r1750, %r1749, 6; | |
bfe.u32 %r1751, %r1748, 16, 6; | |
or.b32 %r5178, %r1750, %r1751; | |
st.local.u32 [%rd1+124], %r5178; | |
setp.le.u32 %p27, %r146, %r5178; | |
mov.u32 %r5177, %r146; | |
@%p27 bra BB0_54; | |
st.local.u32 [%rd1+120], %r5178; | |
st.local.u32 [%rd1+124], %r146; | |
mov.u32 %r4502, %r5178; | |
mov.u32 %r5178, %r146; | |
mov.u32 %r5177, %r4502; | |
BB0_54: | |
mov.u32 %r149, %r5177; | |
mov.u32 %r148, %r5178; | |
setp.le.u32 %p28, %r5171, %r149; | |
mov.u32 %r5173, %r149; | |
mov.u32 %r5174, %r148; | |
@%p28 bra BB0_56; | |
st.local.u32 [%rd1+112], %r149; | |
st.local.u32 [%rd1+120], %r5171; | |
st.local.u32 [%rd1+116], %r148; | |
st.local.u32 [%rd1+124], %r5172; | |
mov.u32 %r4499, %r5172; | |
mov.u32 %r4501, %r5171; | |
mov.u32 %r5172, %r148; | |
mov.u32 %r5171, %r149; | |
mov.u32 %r5173, %r4501; | |
mov.u32 %r5174, %r4499; | |
BB0_56: | |
mov.u32 %r153, %r5171; | |
mov.u32 %r152, %r5172; | |
mov.u32 %r151, %r5173; | |
mov.u32 %r150, %r5174; | |
setp.le.u32 %p29, %r5155, %r153; | |
mov.u32 %r5159, %r153; | |
mov.u32 %r5160, %r152; | |
mov.u32 %r5161, %r151; | |
mov.u32 %r5162, %r150; | |
@%p29 bra BB0_58; | |
st.local.u32 [%rd1+96], %r153; | |
st.local.u32 [%rd1+112], %r5155; | |
st.local.u32 [%rd1+100], %r152; | |
st.local.u32 [%rd1+116], %r5156; | |
st.local.u32 [%rd1+104], %r151; | |
st.local.u32 [%rd1+120], %r5157; | |
st.local.u32 [%rd1+108], %r150; | |
st.local.u32 [%rd1+124], %r5158; | |
mov.u32 %r4489, %r5158; | |
mov.u32 %r4491, %r5157; | |
mov.u32 %r4493, %r5156; | |
mov.u32 %r4495, %r5155; | |
mov.u32 %r5158, %r150; | |
mov.u32 %r5157, %r151; | |
mov.u32 %r5156, %r152; | |
mov.u32 %r5155, %r153; | |
mov.u32 %r5159, %r4495; | |
mov.u32 %r5160, %r4493; | |
mov.u32 %r5161, %r4491; | |
mov.u32 %r5162, %r4489; | |
BB0_58: | |
mov.u32 %r161, %r5155; | |
mov.u32 %r160, %r5156; | |
mov.u32 %r159, %r5157; | |
mov.u32 %r158, %r5158; | |
mov.u32 %r157, %r5159; | |
mov.u32 %r156, %r5160; | |
mov.u32 %r155, %r5161; | |
mov.u32 %r154, %r5162; | |
setp.le.u32 %p30, %r5115, %r161; | |
mov.u32 %r5123, %r161; | |
mov.u32 %r5124, %r160; | |
mov.u32 %r5125, %r159; | |
mov.u32 %r5126, %r158; | |
mov.u32 %r5127, %r157; | |
mov.u32 %r5128, %r156; | |
mov.u32 %r5129, %r155; | |
mov.u32 %r5130, %r154; | |
@%p30 bra BB0_60; | |
st.local.u32 [%rd1+64], %r161; | |
st.local.u32 [%rd1+96], %r5115; | |
st.local.u32 [%rd1+68], %r160; | |
st.local.u32 [%rd1+100], %r5116; | |
st.local.u32 [%rd1+72], %r159; | |
st.local.u32 [%rd1+104], %r5117; | |
st.local.u32 [%rd1+76], %r158; | |
st.local.u32 [%rd1+108], %r5118; | |
st.local.u32 [%rd1+80], %r157; | |
st.local.u32 [%rd1+112], %r5119; | |
st.local.u32 [%rd1+84], %r156; | |
st.local.u32 [%rd1+116], %r5120; | |
st.local.u32 [%rd1+88], %r155; | |
st.local.u32 [%rd1+120], %r5121; | |
st.local.u32 [%rd1+92], %r154; | |
st.local.u32 [%rd1+124], %r5122; | |
mov.u32 %r4461, %r5122; | |
mov.u32 %r4463, %r5121; | |
mov.u32 %r4465, %r5120; | |
mov.u32 %r4467, %r5119; | |
mov.u32 %r4469, %r5118; | |
mov.u32 %r4471, %r5117; | |
mov.u32 %r4473, %r5116; | |
mov.u32 %r4475, %r5115; | |
mov.u32 %r5122, %r154; | |
mov.u32 %r5121, %r155; | |
mov.u32 %r5120, %r156; | |
mov.u32 %r5119, %r157; | |
mov.u32 %r5118, %r158; | |
mov.u32 %r5117, %r159; | |
mov.u32 %r5116, %r160; | |
mov.u32 %r5115, %r161; | |
mov.u32 %r5123, %r4475; | |
mov.u32 %r5124, %r4473; | |
mov.u32 %r5125, %r4471; | |
mov.u32 %r5126, %r4469; | |
mov.u32 %r5127, %r4467; | |
mov.u32 %r5128, %r4465; | |
mov.u32 %r5129, %r4463; | |
mov.u32 %r5130, %r4461; | |
BB0_60: | |
mov.u32 %r177, %r5115; | |
mov.u32 %r176, %r5116; | |
mov.u32 %r175, %r5117; | |
mov.u32 %r174, %r5118; | |
mov.u32 %r173, %r5119; | |
mov.u32 %r172, %r5120; | |
mov.u32 %r171, %r5121; | |
mov.u32 %r170, %r5122; | |
mov.u32 %r169, %r5123; | |
mov.u32 %r168, %r5124; | |
mov.u32 %r167, %r5125; | |
mov.u32 %r166, %r5126; | |
mov.u32 %r165, %r5127; | |
mov.u32 %r164, %r5128; | |
mov.u32 %r163, %r5129; | |
mov.u32 %r162, %r5130; | |
setp.le.u32 %p31, %r5019, %r177; | |
mov.u32 %r5035, %r177; | |
mov.u32 %r5036, %r176; | |
mov.u32 %r5037, %r175; | |
mov.u32 %r5038, %r174; | |
mov.u32 %r5039, %r173; | |
mov.u32 %r5040, %r172; | |
mov.u32 %r5041, %r171; | |
mov.u32 %r5042, %r170; | |
mov.u32 %r5043, %r169; | |
mov.u32 %r5044, %r168; | |
mov.u32 %r5045, %r167; | |
mov.u32 %r5046, %r166; | |
mov.u32 %r5047, %r165; | |
mov.u32 %r5048, %r164; | |
mov.u32 %r5049, %r163; | |
mov.u32 %r5050, %r162; | |
@%p31 bra BB0_62; | |
st.local.u32 [%rd1], %r177; | |
st.local.u32 [%rd1+64], %r5019; | |
st.local.u32 [%rd1+4], %r176; | |
st.local.u32 [%rd1+68], %r5020; | |
st.local.u32 [%rd1+8], %r175; | |
st.local.u32 [%rd1+72], %r5021; | |
st.local.u32 [%rd1+12], %r174; | |
st.local.u32 [%rd1+76], %r5022; | |
st.local.u32 [%rd1+16], %r173; | |
st.local.u32 [%rd1+80], %r5023; | |
st.local.u32 [%rd1+20], %r172; | |
st.local.u32 [%rd1+84], %r5024; | |
st.local.u32 [%rd1+24], %r171; | |
st.local.u32 [%rd1+88], %r5025; | |
st.local.u32 [%rd1+28], %r170; | |
st.local.u32 [%rd1+92], %r5026; | |
st.local.u32 [%rd1+32], %r169; | |
st.local.u32 [%rd1+96], %r5027; | |
st.local.u32 [%rd1+36], %r168; | |
st.local.u32 [%rd1+100], %r5028; | |
st.local.u32 [%rd1+40], %r167; | |
st.local.u32 [%rd1+104], %r5029; | |
st.local.u32 [%rd1+44], %r166; | |
st.local.u32 [%rd1+108], %r5030; | |
st.local.u32 [%rd1+48], %r165; | |
st.local.u32 [%rd1+112], %r5031; | |
st.local.u32 [%rd1+52], %r164; | |
st.local.u32 [%rd1+116], %r5032; | |
st.local.u32 [%rd1+56], %r163; | |
st.local.u32 [%rd1+120], %r5033; | |
st.local.u32 [%rd1+60], %r162; | |
st.local.u32 [%rd1+124], %r5034; | |
mov.u32 %r4389, %r5034; | |
mov.u32 %r4391, %r5033; | |
mov.u32 %r4393, %r5032; | |
mov.u32 %r4395, %r5031; | |
mov.u32 %r4397, %r5030; | |
mov.u32 %r4399, %r5029; | |
mov.u32 %r4401, %r5028; | |
mov.u32 %r4403, %r5027; | |
mov.u32 %r4405, %r5026; | |
mov.u32 %r4407, %r5025; | |
mov.u32 %r4409, %r5024; | |
mov.u32 %r4411, %r5023; | |
mov.u32 %r4413, %r5022; | |
mov.u32 %r4415, %r5021; | |
mov.u32 %r4417, %r5020; | |
mov.u32 %r4419, %r5019; | |
mov.u32 %r5034, %r162; | |
mov.u32 %r5033, %r163; | |
mov.u32 %r5032, %r164; | |
mov.u32 %r5031, %r165; | |
mov.u32 %r5030, %r166; | |
mov.u32 %r5029, %r167; | |
mov.u32 %r5028, %r168; | |
mov.u32 %r5027, %r169; | |
mov.u32 %r5026, %r170; | |
mov.u32 %r5025, %r171; | |
mov.u32 %r5024, %r172; | |
mov.u32 %r5023, %r173; | |
mov.u32 %r5022, %r174; | |
mov.u32 %r5021, %r175; | |
mov.u32 %r5020, %r176; | |
mov.u32 %r5019, %r177; | |
mov.u32 %r5035, %r4419; | |
mov.u32 %r5036, %r4417; | |
mov.u32 %r5037, %r4415; | |
mov.u32 %r5038, %r4413; | |
mov.u32 %r5039, %r4411; | |
mov.u32 %r5040, %r4409; | |
mov.u32 %r5041, %r4407; | |
mov.u32 %r5042, %r4405; | |
mov.u32 %r5043, %r4403; | |
mov.u32 %r5044, %r4401; | |
mov.u32 %r5045, %r4399; | |
mov.u32 %r5046, %r4397; | |
mov.u32 %r5047, %r4395; | |
mov.u32 %r5048, %r4393; | |
mov.u32 %r5049, %r4391; | |
mov.u32 %r5050, %r4389; | |
BB0_62: | |
mov.u32 %r209, %r5019; | |
bfe.u32 %r1753, %r2, 22, 6; | |
mul.wide.u32 %rd370, %r1753, 28; | |
add.s64 %rd371, %rd148, %rd370; | |
ld.global.u32 %r210, [%rd371+4]; | |
and.b32 %r1754, %r210, 65535; | |
mul.wide.u32 %rd372, %r1754, 1792; | |
add.s64 %rd373, %rd3, %rd372; | |
bfe.u32 %r1755, %r210, 16, 6; | |
mul.wide.u32 %rd374, %r1755, 28; | |
add.s64 %rd375, %rd373, %rd374; | |
ld.global.u32 %r211, [%rd375+-4]; | |
and.b32 %r1756, %r211, 65535; | |
bfe.u32 %r1757, %r211, 16, 6; | |
mul.wide.u32 %rd376, %r1756, 1792; | |
add.s64 %rd377, %rd146, %rd376; | |
mul.wide.u32 %rd378, %r1757, 28; | |
add.s64 %rd379, %rd377, %rd378; | |
ld.global.u32 %r212, [%rd379]; | |
and.b32 %r1758, %r212, 65535; | |
mul.wide.u32 %rd380, %r1758, 1792; | |
add.s64 %rd381, %rd3, %rd380; | |
cvt.u64.u32 %rd16, %r1754; | |
cvt.u64.u32 %rd17, %r1756; | |
cvt.u64.u32 %rd18, %r1758; | |
bfe.u32 %r1759, %r212, 16, 6; | |
mul.wide.u32 %rd382, %r1759, 28; | |
add.s64 %rd383, %rd381, %rd382; | |
ld.global.u32 %r213, [%rd383+-8]; | |
and.b32 %r1760, %r213, 65535; | |
cvt.u64.u32 %rd19, %r1760; | |
bfe.u32 %r1761, %r213, 16, 6; | |
mul.wide.u32 %rd384, %r1760, 1792; | |
add.s64 %rd385, %rd136, %rd384; | |
mul.wide.u32 %rd386, %r1761, 28; | |
add.s64 %rd387, %rd385, %rd386; | |
ld.global.u32 %r1762, [%rd387]; | |
and.b32 %r1763, %r1762, 65535; | |
bfe.u32 %r1764, %r1762, 16, 6; | |
mul.wide.u32 %rd388, %r1763, 1792; | |
add.s64 %rd389, %rd135, %rd388; | |
mul.wide.u32 %rd390, %r1764, 28; | |
add.s64 %rd391, %rd389, %rd390; | |
ld.global.u32 %r1765, [%rd391]; | |
and.b32 %r1766, %r1765, 65535; | |
shl.b32 %r1767, %r1766, 6; | |
bfe.u32 %r1768, %r1765, 16, 6; | |
or.b32 %r214, %r1767, %r1768; | |
st.local.u32 [%rd1+128], %r214; | |
bfe.u32 %r1769, %r1762, 22, 6; | |
mul.wide.u32 %rd392, %r1769, 28; | |
add.s64 %rd393, %rd389, %rd392; | |
ld.global.u32 %r1770, [%rd393]; | |
and.b32 %r1771, %r1770, 65535; | |
shl.b32 %r1772, %r1771, 6; | |
bfe.u32 %r1773, %r1770, 16, 6; | |
or.b32 %r4920, %r1772, %r1773; | |
st.local.u32 [%rd1+132], %r4920; | |
setp.le.u32 %p32, %r214, %r4920; | |
mov.u32 %r4919, %r214; | |
@%p32 bra BB0_64; | |
st.local.u32 [%rd1+128], %r4920; | |
st.local.u32 [%rd1+132], %r214; | |
mov.u32 %r4565, %r4920; | |
mov.u32 %r4920, %r214; | |
mov.u32 %r4919, %r4565; | |
BB0_64: | |
mov.u32 %r4915, %r4919; | |
mov.u32 %r4916, %r4920; | |
bfe.u32 %r1774, %r213, 22, 6; | |
mul.lo.s64 %rd394, %rd19, 1792; | |
add.s64 %rd395, %rd136, %rd394; | |
mul.wide.u32 %rd396, %r1774, 28; | |
add.s64 %rd397, %rd395, %rd396; | |
ld.global.u32 %r1775, [%rd397]; | |
and.b32 %r1776, %r1775, 65535; | |
bfe.u32 %r1777, %r1775, 16, 6; | |
mul.wide.u32 %rd398, %r1776, 1792; | |
add.s64 %rd399, %rd135, %rd398; | |
mul.wide.u32 %rd400, %r1777, 28; | |
add.s64 %rd401, %rd399, %rd400; | |
ld.global.u32 %r1778, [%rd401]; | |
and.b32 %r1779, %r1778, 65535; | |
shl.b32 %r1780, %r1779, 6; | |
bfe.u32 %r1781, %r1778, 16, 6; | |
or.b32 %r218, %r1780, %r1781; | |
st.local.u32 [%rd1+136], %r218; | |
bfe.u32 %r1782, %r1775, 22, 6; | |
mul.wide.u32 %rd402, %r1782, 28; | |
add.s64 %rd403, %rd399, %rd402; | |
ld.global.u32 %r1783, [%rd403]; | |
and.b32 %r1784, %r1783, 65535; | |
shl.b32 %r1785, %r1784, 6; | |
bfe.u32 %r1786, %r1783, 16, 6; | |
or.b32 %r4922, %r1785, %r1786; | |
st.local.u32 [%rd1+140], %r4922; | |
setp.le.u32 %p33, %r218, %r4922; | |
mov.u32 %r4921, %r218; | |
@%p33 bra BB0_66; | |
st.local.u32 [%rd1+136], %r4922; | |
st.local.u32 [%rd1+140], %r218; | |
mov.u32 %r4571, %r4922; | |
mov.u32 %r4922, %r218; | |
mov.u32 %r4921, %r4571; | |
BB0_66: | |
mov.u32 %r221, %r4921; | |
mov.u32 %r220, %r4922; | |
setp.le.u32 %p34, %r4915, %r221; | |
mov.u32 %r4917, %r221; | |
mov.u32 %r4918, %r220; | |
@%p34 bra BB0_68; | |
st.local.u32 [%rd1+128], %r221; | |
st.local.u32 [%rd1+136], %r4915; | |
st.local.u32 [%rd1+132], %r220; | |
st.local.u32 [%rd1+140], %r4916; | |
mov.u32 %r4568, %r4916; | |
mov.u32 %r4570, %r4915; | |
mov.u32 %r4916, %r220; | |
mov.u32 %r4915, %r221; | |
mov.u32 %r4917, %r4570; | |
mov.u32 %r4918, %r4568; | |
BB0_68: | |
mov.u32 %r4907, %r4915; | |
mov.u32 %r4908, %r4916; | |
mov.u32 %r4909, %r4917; | |
mov.u32 %r4910, %r4918; | |
mul.lo.s64 %rd404, %rd18, 1792; | |
add.s64 %rd405, %rd3, %rd404; | |
bfe.u32 %r1787, %r212, 22, 6; | |
mul.wide.u32 %rd406, %r1787, 28; | |
add.s64 %rd407, %rd405, %rd406; | |
ld.global.u32 %r226, [%rd407+-8]; | |
and.b32 %r1788, %r226, 65535; | |
cvt.u64.u32 %rd20, %r1788; | |
bfe.u32 %r1789, %r226, 16, 6; | |
mul.wide.u32 %rd408, %r1788, 1792; | |
add.s64 %rd409, %rd136, %rd408; | |
mul.wide.u32 %rd410, %r1789, 28; | |
add.s64 %rd411, %rd409, %rd410; | |
ld.global.u32 %r1790, [%rd411]; | |
and.b32 %r1791, %r1790, 65535; | |
bfe.u32 %r1792, %r1790, 16, 6; | |
mul.wide.u32 %rd412, %r1791, 1792; | |
add.s64 %rd413, %rd135, %rd412; | |
mul.wide.u32 %rd414, %r1792, 28; | |
add.s64 %rd415, %rd413, %rd414; | |
ld.global.u32 %r1793, [%rd415]; | |
and.b32 %r1794, %r1793, 65535; | |
shl.b32 %r1795, %r1794, 6; | |
bfe.u32 %r1796, %r1793, 16, 6; | |
or.b32 %r227, %r1795, %r1796; | |
st.local.u32 [%rd1+144], %r227; | |
bfe.u32 %r1797, %r1790, 22, 6; | |
mul.wide.u32 %rd416, %r1797, 28; | |
add.s64 %rd417, %rd413, %rd416; | |
ld.global.u32 %r1798, [%rd417]; | |
and.b32 %r1799, %r1798, 65535; | |
shl.b32 %r1800, %r1799, 6; | |
bfe.u32 %r1801, %r1798, 16, 6; | |
or.b32 %r4928, %r1800, %r1801; | |
st.local.u32 [%rd1+148], %r4928; | |
setp.le.u32 %p35, %r227, %r4928; | |
mov.u32 %r4927, %r227; | |
@%p35 bra BB0_70; | |
st.local.u32 [%rd1+144], %r4928; | |
st.local.u32 [%rd1+148], %r227; | |
mov.u32 %r4585, %r4928; | |
mov.u32 %r4928, %r227; | |
mov.u32 %r4927, %r4585; | |
BB0_70: | |
mov.u32 %r4923, %r4927; | |
mov.u32 %r4924, %r4928; | |
bfe.u32 %r1802, %r226, 22, 6; | |
mul.lo.s64 %rd418, %rd20, 1792; | |
add.s64 %rd419, %rd136, %rd418; | |
mul.wide.u32 %rd420, %r1802, 28; | |
add.s64 %rd421, %rd419, %rd420; | |
ld.global.u32 %r1803, [%rd421]; | |
and.b32 %r1804, %r1803, 65535; | |
bfe.u32 %r1805, %r1803, 16, 6; | |
mul.wide.u32 %rd422, %r1804, 1792; | |
add.s64 %rd423, %rd135, %rd422; | |
mul.wide.u32 %rd424, %r1805, 28; | |
add.s64 %rd425, %rd423, %rd424; | |
ld.global.u32 %r1806, [%rd425]; | |
and.b32 %r1807, %r1806, 65535; | |
shl.b32 %r1808, %r1807, 6; | |
bfe.u32 %r1809, %r1806, 16, 6; | |
or.b32 %r231, %r1808, %r1809; | |
st.local.u32 [%rd1+152], %r231; | |
bfe.u32 %r1810, %r1803, 22, 6; | |
mul.wide.u32 %rd426, %r1810, 28; | |
add.s64 %rd427, %rd423, %rd426; | |
ld.global.u32 %r1811, [%rd427]; | |
and.b32 %r1812, %r1811, 65535; | |
shl.b32 %r1813, %r1812, 6; | |
bfe.u32 %r1814, %r1811, 16, 6; | |
or.b32 %r4930, %r1813, %r1814; | |
st.local.u32 [%rd1+156], %r4930; | |
setp.le.u32 %p36, %r231, %r4930; | |
mov.u32 %r4929, %r231; | |
@%p36 bra BB0_72; | |
st.local.u32 [%rd1+152], %r4930; | |
st.local.u32 [%rd1+156], %r231; | |
mov.u32 %r4591, %r4930; | |
mov.u32 %r4930, %r231; | |
mov.u32 %r4929, %r4591; | |
BB0_72: | |
mov.u32 %r234, %r4929; | |
mov.u32 %r233, %r4930; | |
setp.le.u32 %p37, %r4923, %r234; | |
mov.u32 %r4925, %r234; | |
mov.u32 %r4926, %r233; | |
@%p37 bra BB0_74; | |
st.local.u32 [%rd1+144], %r234; | |
st.local.u32 [%rd1+152], %r4923; | |
st.local.u32 [%rd1+148], %r233; | |
st.local.u32 [%rd1+156], %r4924; | |
mov.u32 %r4588, %r4924; | |
mov.u32 %r4590, %r4923; | |
mov.u32 %r4924, %r233; | |
mov.u32 %r4923, %r234; | |
mov.u32 %r4925, %r4590; | |
mov.u32 %r4926, %r4588; | |
BB0_74: | |
mov.u32 %r238, %r4923; | |
mov.u32 %r237, %r4924; | |
mov.u32 %r236, %r4925; | |
mov.u32 %r235, %r4926; | |
setp.le.u32 %p38, %r4907, %r238; | |
mov.u32 %r4911, %r238; | |
mov.u32 %r4912, %r237; | |
mov.u32 %r4913, %r236; | |
mov.u32 %r4914, %r235; | |
@%p38 bra BB0_76; | |
st.local.u32 [%rd1+128], %r238; | |
st.local.u32 [%rd1+144], %r4907; | |
st.local.u32 [%rd1+132], %r237; | |
st.local.u32 [%rd1+148], %r4908; | |
st.local.u32 [%rd1+136], %r236; | |
st.local.u32 [%rd1+152], %r4909; | |
st.local.u32 [%rd1+140], %r235; | |
st.local.u32 [%rd1+156], %r4910; | |
mov.u32 %r4578, %r4910; | |
mov.u32 %r4580, %r4909; | |
mov.u32 %r4582, %r4908; | |
mov.u32 %r4584, %r4907; | |
mov.u32 %r4910, %r235; | |
mov.u32 %r4909, %r236; | |
mov.u32 %r4908, %r237; | |
mov.u32 %r4907, %r238; | |
mov.u32 %r4911, %r4584; | |
mov.u32 %r4912, %r4582; | |
mov.u32 %r4913, %r4580; | |
mov.u32 %r4914, %r4578; | |
BB0_76: | |
mov.u32 %r4891, %r4907; | |
mov.u32 %r4892, %r4908; | |
mov.u32 %r4893, %r4909; | |
mov.u32 %r4894, %r4910; | |
mov.u32 %r4895, %r4911; | |
mov.u32 %r4896, %r4912; | |
mov.u32 %r4897, %r4913; | |
mov.u32 %r4898, %r4914; | |
mul.lo.s64 %rd428, %rd17, 1792; | |
add.s64 %rd429, %rd136, %rd428; | |
bfe.u32 %r1815, %r211, 22, 6; | |
mul.wide.u32 %rd430, %r1815, 28; | |
add.s64 %rd431, %rd429, %rd430; | |
ld.global.u32 %r247, [%rd431+4]; | |
and.b32 %r1816, %r247, 65535; | |
mul.wide.u32 %rd432, %r1816, 1792; | |
add.s64 %rd433, %rd3, %rd432; | |
cvt.u64.u32 %rd21, %r1816; | |
bfe.u32 %r1817, %r247, 16, 6; | |
mul.wide.u32 %rd434, %r1817, 28; | |
add.s64 %rd435, %rd433, %rd434; | |
ld.global.u32 %r248, [%rd435+-8]; | |
and.b32 %r1818, %r248, 65535; | |
cvt.u64.u32 %rd22, %r1818; | |
bfe.u32 %r1819, %r248, 16, 6; | |
mul.wide.u32 %rd436, %r1818, 1792; | |
add.s64 %rd437, %rd136, %rd436; | |
mul.wide.u32 %rd438, %r1819, 28; | |
add.s64 %rd439, %rd437, %rd438; | |
ld.global.u32 %r1820, [%rd439]; | |
and.b32 %r1821, %r1820, 65535; | |
bfe.u32 %r1822, %r1820, 16, 6; | |
mul.wide.u32 %rd440, %r1821, 1792; | |
add.s64 %rd441, %rd135, %rd440; | |
mul.wide.u32 %rd442, %r1822, 28; | |
add.s64 %rd443, %rd441, %rd442; | |
ld.global.u32 %r1823, [%rd443]; | |
and.b32 %r1824, %r1823, 65535; | |
shl.b32 %r1825, %r1824, 6; | |
bfe.u32 %r1826, %r1823, 16, 6; | |
or.b32 %r249, %r1825, %r1826; | |
st.local.u32 [%rd1+160], %r249; | |
bfe.u32 %r1827, %r1820, 22, 6; | |
mul.wide.u32 %rd444, %r1827, 28; | |
add.s64 %rd445, %rd441, %rd444; | |
ld.global.u32 %r1828, [%rd445]; | |
and.b32 %r1829, %r1828, 65535; | |
shl.b32 %r1830, %r1829, 6; | |
bfe.u32 %r1831, %r1828, 16, 6; | |
or.b32 %r4944, %r1830, %r1831; | |
st.local.u32 [%rd1+164], %r4944; | |
setp.le.u32 %p39, %r249, %r4944; | |
mov.u32 %r4943, %r249; | |
@%p39 bra BB0_78; | |
st.local.u32 [%rd1+160], %r4944; | |
st.local.u32 [%rd1+164], %r249; | |
mov.u32 %r4621, %r4944; | |
mov.u32 %r4944, %r249; | |
mov.u32 %r4943, %r4621; | |
BB0_78: | |
mov.u32 %r4939, %r4943; | |
mov.u32 %r4940, %r4944; | |
bfe.u32 %r1832, %r248, 22, 6; | |
mul.lo.s64 %rd446, %rd22, 1792; | |
add.s64 %rd447, %rd136, %rd446; | |
mul.wide.u32 %rd448, %r1832, 28; | |
add.s64 %rd449, %rd447, %rd448; | |
ld.global.u32 %r1833, [%rd449]; | |
and.b32 %r1834, %r1833, 65535; | |
bfe.u32 %r1835, %r1833, 16, 6; | |
mul.wide.u32 %rd450, %r1834, 1792; | |
add.s64 %rd451, %rd135, %rd450; | |
mul.wide.u32 %rd452, %r1835, 28; | |
add.s64 %rd453, %rd451, %rd452; | |
ld.global.u32 %r1836, [%rd453]; | |
and.b32 %r1837, %r1836, 65535; | |
shl.b32 %r1838, %r1837, 6; | |
bfe.u32 %r1839, %r1836, 16, 6; | |
or.b32 %r253, %r1838, %r1839; | |
st.local.u32 [%rd1+168], %r253; | |
bfe.u32 %r1840, %r1833, 22, 6; | |
mul.wide.u32 %rd454, %r1840, 28; | |
add.s64 %rd455, %rd451, %rd454; | |
ld.global.u32 %r1841, [%rd455]; | |
and.b32 %r1842, %r1841, 65535; | |
shl.b32 %r1843, %r1842, 6; | |
bfe.u32 %r1844, %r1841, 16, 6; | |
or.b32 %r4946, %r1843, %r1844; | |
st.local.u32 [%rd1+172], %r4946; | |
setp.le.u32 %p40, %r253, %r4946; | |
mov.u32 %r4945, %r253; | |
@%p40 bra BB0_80; | |
st.local.u32 [%rd1+168], %r4946; | |
st.local.u32 [%rd1+172], %r253; | |
mov.u32 %r4627, %r4946; | |
mov.u32 %r4946, %r253; | |
mov.u32 %r4945, %r4627; | |
BB0_80: | |
mov.u32 %r256, %r4945; | |
mov.u32 %r255, %r4946; | |
setp.le.u32 %p41, %r4939, %r256; | |
mov.u32 %r4941, %r256; | |
mov.u32 %r4942, %r255; | |
@%p41 bra BB0_82; | |
st.local.u32 [%rd1+160], %r256; | |
st.local.u32 [%rd1+168], %r4939; | |
st.local.u32 [%rd1+164], %r255; | |
st.local.u32 [%rd1+172], %r4940; | |
mov.u32 %r4624, %r4940; | |
mov.u32 %r4626, %r4939; | |
mov.u32 %r4940, %r255; | |
mov.u32 %r4939, %r256; | |
mov.u32 %r4941, %r4626; | |
mov.u32 %r4942, %r4624; | |
BB0_82: | |
mov.u32 %r4931, %r4939; | |
mov.u32 %r4932, %r4940; | |
mov.u32 %r4933, %r4941; | |
mov.u32 %r4934, %r4942; | |
mul.lo.s64 %rd456, %rd21, 1792; | |
add.s64 %rd457, %rd3, %rd456; | |
bfe.u32 %r1845, %r247, 22, 6; | |
mul.wide.u32 %rd458, %r1845, 28; | |
add.s64 %rd459, %rd457, %rd458; | |
ld.global.u32 %r261, [%rd459+-8]; | |
and.b32 %r1846, %r261, 65535; | |
cvt.u64.u32 %rd23, %r1846; | |
bfe.u32 %r1847, %r261, 16, 6; | |
mul.wide.u32 %rd460, %r1846, 1792; | |
add.s64 %rd461, %rd136, %rd460; | |
mul.wide.u32 %rd462, %r1847, 28; | |
add.s64 %rd463, %rd461, %rd462; | |
ld.global.u32 %r1848, [%rd463]; | |
and.b32 %r1849, %r1848, 65535; | |
bfe.u32 %r1850, %r1848, 16, 6; | |
mul.wide.u32 %rd464, %r1849, 1792; | |
add.s64 %rd465, %rd135, %rd464; | |
mul.wide.u32 %rd466, %r1850, 28; | |
add.s64 %rd467, %rd465, %rd466; | |
ld.global.u32 %r1851, [%rd467]; | |
and.b32 %r1852, %r1851, 65535; | |
shl.b32 %r1853, %r1852, 6; | |
bfe.u32 %r1854, %r1851, 16, 6; | |
or.b32 %r262, %r1853, %r1854; | |
st.local.u32 [%rd1+176], %r262; | |
bfe.u32 %r1855, %r1848, 22, 6; | |
mul.wide.u32 %rd468, %r1855, 28; | |
add.s64 %rd469, %rd465, %rd468; | |
ld.global.u32 %r1856, [%rd469]; | |
and.b32 %r1857, %r1856, 65535; | |
shl.b32 %r1858, %r1857, 6; | |
bfe.u32 %r1859, %r1856, 16, 6; | |
or.b32 %r4952, %r1858, %r1859; | |
st.local.u32 [%rd1+180], %r4952; | |
setp.le.u32 %p42, %r262, %r4952; | |
mov.u32 %r4951, %r262; | |
@%p42 bra BB0_84; | |
st.local.u32 [%rd1+176], %r4952; | |
st.local.u32 [%rd1+180], %r262; | |
mov.u32 %r4641, %r4952; | |
mov.u32 %r4952, %r262; | |
mov.u32 %r4951, %r4641; | |
BB0_84: | |
mov.u32 %r4947, %r4951; | |
mov.u32 %r4948, %r4952; | |
bfe.u32 %r1860, %r261, 22, 6; | |
mul.lo.s64 %rd470, %rd23, 1792; | |
add.s64 %rd471, %rd136, %rd470; | |
mul.wide.u32 %rd472, %r1860, 28; | |
add.s64 %rd473, %rd471, %rd472; | |
ld.global.u32 %r1861, [%rd473]; | |
and.b32 %r1862, %r1861, 65535; | |
bfe.u32 %r1863, %r1861, 16, 6; | |
mul.wide.u32 %rd474, %r1862, 1792; | |
add.s64 %rd475, %rd135, %rd474; | |
mul.wide.u32 %rd476, %r1863, 28; | |
add.s64 %rd477, %rd475, %rd476; | |
ld.global.u32 %r1864, [%rd477]; | |
and.b32 %r1865, %r1864, 65535; | |
shl.b32 %r1866, %r1865, 6; | |
bfe.u32 %r1867, %r1864, 16, 6; | |
or.b32 %r266, %r1866, %r1867; | |
st.local.u32 [%rd1+184], %r266; | |
bfe.u32 %r1868, %r1861, 22, 6; | |
mul.wide.u32 %rd478, %r1868, 28; | |
add.s64 %rd479, %rd475, %rd478; | |
ld.global.u32 %r1869, [%rd479]; | |
and.b32 %r1870, %r1869, 65535; | |
shl.b32 %r1871, %r1870, 6; | |
bfe.u32 %r1872, %r1869, 16, 6; | |
or.b32 %r4954, %r1871, %r1872; | |
st.local.u32 [%rd1+188], %r4954; | |
setp.le.u32 %p43, %r266, %r4954; | |
mov.u32 %r4953, %r266; | |
@%p43 bra BB0_86; | |
st.local.u32 [%rd1+184], %r4954; | |
st.local.u32 [%rd1+188], %r266; | |
mov.u32 %r4647, %r4954; | |
mov.u32 %r4954, %r266; | |
mov.u32 %r4953, %r4647; | |
BB0_86: | |
mov.u32 %r269, %r4953; | |
mov.u32 %r268, %r4954; | |
setp.le.u32 %p44, %r4947, %r269; | |
mov.u32 %r4949, %r269; | |
mov.u32 %r4950, %r268; | |
@%p44 bra BB0_88; | |
st.local.u32 [%rd1+176], %r269; | |
st.local.u32 [%rd1+184], %r4947; | |
st.local.u32 [%rd1+180], %r268; | |
st.local.u32 [%rd1+188], %r4948; | |
mov.u32 %r4644, %r4948; | |
mov.u32 %r4646, %r4947; | |
mov.u32 %r4948, %r268; | |
mov.u32 %r4947, %r269; | |
mov.u32 %r4949, %r4646; | |
mov.u32 %r4950, %r4644; | |
BB0_88: | |
mov.u32 %r273, %r4947; | |
mov.u32 %r272, %r4948; | |
mov.u32 %r271, %r4949; | |
mov.u32 %r270, %r4950; | |
setp.le.u32 %p45, %r4931, %r273; | |
mov.u32 %r4935, %r273; | |
mov.u32 %r4936, %r272; | |
mov.u32 %r4937, %r271; | |
mov.u32 %r4938, %r270; | |
@%p45 bra BB0_90; | |
st.local.u32 [%rd1+160], %r273; | |
st.local.u32 [%rd1+176], %r4931; | |
st.local.u32 [%rd1+164], %r272; | |
st.local.u32 [%rd1+180], %r4932; | |
st.local.u32 [%rd1+168], %r271; | |
st.local.u32 [%rd1+184], %r4933; | |
st.local.u32 [%rd1+172], %r270; | |
st.local.u32 [%rd1+188], %r4934; | |
mov.u32 %r4634, %r4934; | |
mov.u32 %r4636, %r4933; | |
mov.u32 %r4638, %r4932; | |
mov.u32 %r4640, %r4931; | |
mov.u32 %r4934, %r270; | |
mov.u32 %r4933, %r271; | |
mov.u32 %r4932, %r272; | |
mov.u32 %r4931, %r273; | |
mov.u32 %r4935, %r4640; | |
mov.u32 %r4936, %r4638; | |
mov.u32 %r4937, %r4636; | |
mov.u32 %r4938, %r4634; | |
BB0_90: | |
mov.u32 %r281, %r4931; | |
mov.u32 %r280, %r4932; | |
mov.u32 %r279, %r4933; | |
mov.u32 %r278, %r4934; | |
mov.u32 %r277, %r4935; | |
mov.u32 %r276, %r4936; | |
mov.u32 %r275, %r4937; | |
mov.u32 %r274, %r4938; | |
setp.le.u32 %p46, %r4891, %r281; | |
mov.u32 %r4899, %r281; | |
mov.u32 %r4900, %r280; | |
mov.u32 %r4901, %r279; | |
mov.u32 %r4902, %r278; | |
mov.u32 %r4903, %r277; | |
mov.u32 %r4904, %r276; | |
mov.u32 %r4905, %r275; | |
mov.u32 %r4906, %r274; | |
@%p46 bra BB0_92; | |
st.local.u32 [%rd1+128], %r281; | |
st.local.u32 [%rd1+160], %r4891; | |
st.local.u32 [%rd1+132], %r280; | |
st.local.u32 [%rd1+164], %r4892; | |
st.local.u32 [%rd1+136], %r279; | |
st.local.u32 [%rd1+168], %r4893; | |
st.local.u32 [%rd1+140], %r278; | |
st.local.u32 [%rd1+172], %r4894; | |
st.local.u32 [%rd1+144], %r277; | |
st.local.u32 [%rd1+176], %r4895; | |
st.local.u32 [%rd1+148], %r276; | |
st.local.u32 [%rd1+180], %r4896; | |
st.local.u32 [%rd1+152], %r275; | |
st.local.u32 [%rd1+184], %r4897; | |
st.local.u32 [%rd1+156], %r274; | |
st.local.u32 [%rd1+188], %r4898; | |
mov.u32 %r4606, %r4898; | |
mov.u32 %r4608, %r4897; | |
mov.u32 %r4610, %r4896; | |
mov.u32 %r4612, %r4895; | |
mov.u32 %r4614, %r4894; | |
mov.u32 %r4616, %r4893; | |
mov.u32 %r4618, %r4892; | |
mov.u32 %r4620, %r4891; | |
mov.u32 %r4898, %r274; | |
mov.u32 %r4897, %r275; | |
mov.u32 %r4896, %r276; | |
mov.u32 %r4895, %r277; | |
mov.u32 %r4894, %r278; | |
mov.u32 %r4893, %r279; | |
mov.u32 %r4892, %r280; | |
mov.u32 %r4891, %r281; | |
mov.u32 %r4899, %r4620; | |
mov.u32 %r4900, %r4618; | |
mov.u32 %r4901, %r4616; | |
mov.u32 %r4902, %r4614; | |
mov.u32 %r4903, %r4612; | |
mov.u32 %r4904, %r4610; | |
mov.u32 %r4905, %r4608; | |
mov.u32 %r4906, %r4606; | |
BB0_92: | |
mov.u32 %r4859, %r4891; | |
mov.u32 %r4860, %r4892; | |
mov.u32 %r4861, %r4893; | |
mov.u32 %r4862, %r4894; | |
mov.u32 %r4863, %r4895; | |
mov.u32 %r4864, %r4896; | |
mov.u32 %r4865, %r4897; | |
mov.u32 %r4866, %r4898; | |
mov.u32 %r4867, %r4899; | |
mov.u32 %r4868, %r4900; | |
mov.u32 %r4869, %r4901; | |
mov.u32 %r4870, %r4902; | |
mov.u32 %r4871, %r4903; | |
mov.u32 %r4872, %r4904; | |
mov.u32 %r4873, %r4905; | |
mov.u32 %r4874, %r4906; | |
mul.lo.s64 %rd480, %rd16, 1792; | |
add.s64 %rd481, %rd3, %rd480; | |
bfe.u32 %r1873, %r210, 22, 6; | |
mul.wide.u32 %rd482, %r1873, 28; | |
add.s64 %rd483, %rd481, %rd482; | |
ld.global.u32 %r298, [%rd483+-4]; | |
and.b32 %r1874, %r298, 65535; | |
mul.wide.u32 %rd484, %r1874, 1792; | |
add.s64 %rd485, %rd136, %rd484; | |
bfe.u32 %r1875, %r298, 16, 6; | |
mul.wide.u32 %rd486, %r1875, 28; | |
add.s64 %rd487, %rd485, %rd486; | |
ld.global.u32 %r299, [%rd487+4]; | |
and.b32 %r1876, %r299, 65535; | |
mul.wide.u32 %rd488, %r1876, 1792; | |
add.s64 %rd489, %rd3, %rd488; | |
cvt.u64.u32 %rd24, %r1874; | |
cvt.u64.u32 %rd25, %r1876; | |
bfe.u32 %r1877, %r299, 16, 6; | |
mul.wide.u32 %rd490, %r1877, 28; | |
add.s64 %rd491, %rd489, %rd490; | |
ld.global.u32 %r300, [%rd491+-8]; | |
and.b32 %r1878, %r300, 65535; | |
cvt.u64.u32 %rd26, %r1878; | |
bfe.u32 %r1879, %r300, 16, 6; | |
mul.wide.u32 %rd492, %r1878, 1792; | |
add.s64 %rd493, %rd136, %rd492; | |
mul.wide.u32 %rd494, %r1879, 28; | |
add.s64 %rd495, %rd493, %rd494; | |
ld.global.u32 %r1880, [%rd495]; | |
and.b32 %r1881, %r1880, 65535; | |
bfe.u32 %r1882, %r1880, 16, 6; | |
mul.wide.u32 %rd496, %r1881, 1792; | |
add.s64 %rd497, %rd135, %rd496; | |
mul.wide.u32 %rd498, %r1882, 28; | |
add.s64 %rd499, %rd497, %rd498; | |
ld.global.u32 %r1883, [%rd499]; | |
and.b32 %r1884, %r1883, 65535; | |
shl.b32 %r1885, %r1884, 6; | |
bfe.u32 %r1886, %r1883, 16, 6; | |
or.b32 %r301, %r1885, %r1886; | |
st.local.u32 [%rd1+192], %r301; | |
bfe.u32 %r1887, %r1880, 22, 6; | |
mul.wide.u32 %rd500, %r1887, 28; | |
add.s64 %rd501, %rd497, %rd500; | |
ld.global.u32 %r1888, [%rd501]; | |
and.b32 %r1889, %r1888, 65535; | |
shl.b32 %r1890, %r1889, 6; | |
bfe.u32 %r1891, %r1888, 16, 6; | |
or.b32 %r4984, %r1890, %r1891; | |
st.local.u32 [%rd1+196], %r4984; | |
setp.le.u32 %p47, %r301, %r4984; | |
mov.u32 %r4983, %r301; | |
@%p47 bra BB0_94; | |
st.local.u32 [%rd1+192], %r4984; | |
st.local.u32 [%rd1+196], %r301; | |
mov.u32 %r4709, %r4984; | |
mov.u32 %r4984, %r301; | |
mov.u32 %r4983, %r4709; | |
BB0_94: | |
mov.u32 %r4979, %r4983; | |
mov.u32 %r4980, %r4984; | |
bfe.u32 %r1892, %r300, 22, 6; | |
mul.lo.s64 %rd502, %rd26, 1792; | |
add.s64 %rd503, %rd136, %rd502; | |
mul.wide.u32 %rd504, %r1892, 28; | |
add.s64 %rd505, %rd503, %rd504; | |
ld.global.u32 %r1893, [%rd505]; | |
and.b32 %r1894, %r1893, 65535; | |
bfe.u32 %r1895, %r1893, 16, 6; | |
mul.wide.u32 %rd506, %r1894, 1792; | |
add.s64 %rd507, %rd135, %rd506; | |
mul.wide.u32 %rd508, %r1895, 28; | |
add.s64 %rd509, %rd507, %rd508; | |
ld.global.u32 %r1896, [%rd509]; | |
and.b32 %r1897, %r1896, 65535; | |
shl.b32 %r1898, %r1897, 6; | |
bfe.u32 %r1899, %r1896, 16, 6; | |
or.b32 %r305, %r1898, %r1899; | |
st.local.u32 [%rd1+200], %r305; | |
bfe.u32 %r1900, %r1893, 22, 6; | |
mul.wide.u32 %rd510, %r1900, 28; | |
add.s64 %rd511, %rd507, %rd510; | |
ld.global.u32 %r1901, [%rd511]; | |
and.b32 %r1902, %r1901, 65535; | |
shl.b32 %r1903, %r1902, 6; | |
bfe.u32 %r1904, %r1901, 16, 6; | |
or.b32 %r4986, %r1903, %r1904; | |
st.local.u32 [%rd1+204], %r4986; | |
setp.le.u32 %p48, %r305, %r4986; | |
mov.u32 %r4985, %r305; | |
@%p48 bra BB0_96; | |
st.local.u32 [%rd1+200], %r4986; | |
st.local.u32 [%rd1+204], %r305; | |
mov.u32 %r4715, %r4986; | |
mov.u32 %r4986, %r305; | |
mov.u32 %r4985, %r4715; | |
BB0_96: | |
mov.u32 %r308, %r4985; | |
mov.u32 %r307, %r4986; | |
setp.le.u32 %p49, %r4979, %r308; | |
mov.u32 %r4981, %r308; | |
mov.u32 %r4982, %r307; | |
@%p49 bra BB0_98; | |
st.local.u32 [%rd1+192], %r308; | |
st.local.u32 [%rd1+200], %r4979; | |
st.local.u32 [%rd1+196], %r307; | |
st.local.u32 [%rd1+204], %r4980; | |
mov.u32 %r4712, %r4980; | |
mov.u32 %r4714, %r4979; | |
mov.u32 %r4980, %r307; | |
mov.u32 %r4979, %r308; | |
mov.u32 %r4981, %r4714; | |
mov.u32 %r4982, %r4712; | |
BB0_98: | |
mov.u32 %r4971, %r4979; | |
mov.u32 %r4972, %r4980; | |
mov.u32 %r4973, %r4981; | |
mov.u32 %r4974, %r4982; | |
mul.lo.s64 %rd512, %rd25, 1792; | |
add.s64 %rd513, %rd3, %rd512; | |
bfe.u32 %r1905, %r299, 22, 6; | |
mul.wide.u32 %rd514, %r1905, 28; | |
add.s64 %rd515, %rd513, %rd514; | |
ld.global.u32 %r313, [%rd515+-8]; | |
and.b32 %r1906, %r313, 65535; | |
cvt.u64.u32 %rd27, %r1906; | |
bfe.u32 %r1907, %r313, 16, 6; | |
mul.wide.u32 %rd516, %r1906, 1792; | |
add.s64 %rd517, %rd136, %rd516; | |
mul.wide.u32 %rd518, %r1907, 28; | |
add.s64 %rd519, %rd517, %rd518; | |
ld.global.u32 %r1908, [%rd519]; | |
and.b32 %r1909, %r1908, 65535; | |
bfe.u32 %r1910, %r1908, 16, 6; | |
mul.wide.u32 %rd520, %r1909, 1792; | |
add.s64 %rd521, %rd135, %rd520; | |
mul.wide.u32 %rd522, %r1910, 28; | |
add.s64 %rd523, %rd521, %rd522; | |
ld.global.u32 %r1911, [%rd523]; | |
and.b32 %r1912, %r1911, 65535; | |
shl.b32 %r1913, %r1912, 6; | |
bfe.u32 %r1914, %r1911, 16, 6; | |
or.b32 %r314, %r1913, %r1914; | |
st.local.u32 [%rd1+208], %r314; | |
bfe.u32 %r1915, %r1908, 22, 6; | |
mul.wide.u32 %rd524, %r1915, 28; | |
add.s64 %rd525, %rd521, %rd524; | |
ld.global.u32 %r1916, [%rd525]; | |
and.b32 %r1917, %r1916, 65535; | |
shl.b32 %r1918, %r1917, 6; | |
bfe.u32 %r1919, %r1916, 16, 6; | |
or.b32 %r4992, %r1918, %r1919; | |
st.local.u32 [%rd1+212], %r4992; | |
setp.le.u32 %p50, %r314, %r4992; | |
mov.u32 %r4991, %r314; | |
@%p50 bra BB0_100; | |
st.local.u32 [%rd1+208], %r4992; | |
st.local.u32 [%rd1+212], %r314; | |
mov.u32 %r4729, %r4992; | |
mov.u32 %r4992, %r314; | |
mov.u32 %r4991, %r4729; | |
BB0_100: | |
mov.u32 %r4987, %r4991; | |
mov.u32 %r4988, %r4992; | |
bfe.u32 %r1920, %r313, 22, 6; | |
mul.lo.s64 %rd526, %rd27, 1792; | |
add.s64 %rd527, %rd136, %rd526; | |
mul.wide.u32 %rd528, %r1920, 28; | |
add.s64 %rd529, %rd527, %rd528; | |
ld.global.u32 %r1921, [%rd529]; | |
and.b32 %r1922, %r1921, 65535; | |
bfe.u32 %r1923, %r1921, 16, 6; | |
mul.wide.u32 %rd530, %r1922, 1792; | |
add.s64 %rd531, %rd135, %rd530; | |
mul.wide.u32 %rd532, %r1923, 28; | |
add.s64 %rd533, %rd531, %rd532; | |
ld.global.u32 %r1924, [%rd533]; | |
and.b32 %r1925, %r1924, 65535; | |
shl.b32 %r1926, %r1925, 6; | |
bfe.u32 %r1927, %r1924, 16, 6; | |
or.b32 %r318, %r1926, %r1927; | |
st.local.u32 [%rd1+216], %r318; | |
bfe.u32 %r1928, %r1921, 22, 6; | |
mul.wide.u32 %rd534, %r1928, 28; | |
add.s64 %rd535, %rd531, %rd534; | |
ld.global.u32 %r1929, [%rd535]; | |
and.b32 %r1930, %r1929, 65535; | |
shl.b32 %r1931, %r1930, 6; | |
bfe.u32 %r1932, %r1929, 16, 6; | |
or.b32 %r4994, %r1931, %r1932; | |
st.local.u32 [%rd1+220], %r4994; | |
setp.le.u32 %p51, %r318, %r4994; | |
mov.u32 %r4993, %r318; | |
@%p51 bra BB0_102; | |
st.local.u32 [%rd1+216], %r4994; | |
st.local.u32 [%rd1+220], %r318; | |
mov.u32 %r4735, %r4994; | |
mov.u32 %r4994, %r318; | |
mov.u32 %r4993, %r4735; | |
BB0_102: | |
mov.u32 %r321, %r4993; | |
mov.u32 %r320, %r4994; | |
setp.le.u32 %p52, %r4987, %r321; | |
mov.u32 %r4989, %r321; | |
mov.u32 %r4990, %r320; | |
@%p52 bra BB0_104; | |
st.local.u32 [%rd1+208], %r321; | |
st.local.u32 [%rd1+216], %r4987; | |
st.local.u32 [%rd1+212], %r320; | |
st.local.u32 [%rd1+220], %r4988; | |
mov.u32 %r4732, %r4988; | |
mov.u32 %r4734, %r4987; | |
mov.u32 %r4988, %r320; | |
mov.u32 %r4987, %r321; | |
mov.u32 %r4989, %r4734; | |
mov.u32 %r4990, %r4732; | |
BB0_104: | |
mov.u32 %r325, %r4987; | |
mov.u32 %r324, %r4988; | |
mov.u32 %r323, %r4989; | |
mov.u32 %r322, %r4990; | |
setp.le.u32 %p53, %r4971, %r325; | |
mov.u32 %r4975, %r325; | |
mov.u32 %r4976, %r324; | |
mov.u32 %r4977, %r323; | |
mov.u32 %r4978, %r322; | |
@%p53 bra BB0_106; | |
st.local.u32 [%rd1+192], %r325; | |
st.local.u32 [%rd1+208], %r4971; | |
st.local.u32 [%rd1+196], %r324; | |
st.local.u32 [%rd1+212], %r4972; | |
st.local.u32 [%rd1+200], %r323; | |
st.local.u32 [%rd1+216], %r4973; | |
st.local.u32 [%rd1+204], %r322; | |
st.local.u32 [%rd1+220], %r4974; | |
mov.u32 %r4722, %r4974; | |
mov.u32 %r4724, %r4973; | |
mov.u32 %r4726, %r4972; | |
mov.u32 %r4728, %r4971; | |
mov.u32 %r4974, %r322; | |
mov.u32 %r4973, %r323; | |
mov.u32 %r4972, %r324; | |
mov.u32 %r4971, %r325; | |
mov.u32 %r4975, %r4728; | |
mov.u32 %r4976, %r4726; | |
mov.u32 %r4977, %r4724; | |
mov.u32 %r4978, %r4722; | |
BB0_106: | |
mov.u32 %r4955, %r4971; | |
mov.u32 %r4956, %r4972; | |
mov.u32 %r4957, %r4973; | |
mov.u32 %r4958, %r4974; | |
mov.u32 %r4959, %r4975; | |
mov.u32 %r4960, %r4976; | |
mov.u32 %r4961, %r4977; | |
mov.u32 %r4962, %r4978; | |
mul.lo.s64 %rd536, %rd24, 1792; | |
add.s64 %rd537, %rd136, %rd536; | |
bfe.u32 %r1933, %r298, 22, 6; | |
mul.wide.u32 %rd538, %r1933, 28; | |
add.s64 %rd539, %rd537, %rd538; | |
ld.global.u32 %r334, [%rd539+4]; | |
and.b32 %r1934, %r334, 65535; | |
mul.wide.u32 %rd540, %r1934, 1792; | |
add.s64 %rd541, %rd3, %rd540; | |
cvt.u64.u32 %rd28, %r1934; | |
bfe.u32 %r1935, %r334, 16, 6; | |
mul.wide.u32 %rd542, %r1935, 28; | |
add.s64 %rd543, %rd541, %rd542; | |
ld.global.u32 %r335, [%rd543+-8]; | |
and.b32 %r1936, %r335, 65535; | |
cvt.u64.u32 %rd29, %r1936; | |
bfe.u32 %r1937, %r335, 16, 6; | |
mul.wide.u32 %rd544, %r1936, 1792; | |
add.s64 %rd545, %rd136, %rd544; | |
mul.wide.u32 %rd546, %r1937, 28; | |
add.s64 %rd547, %rd545, %rd546; | |
ld.global.u32 %r1938, [%rd547]; | |
and.b32 %r1939, %r1938, 65535; | |
bfe.u32 %r1940, %r1938, 16, 6; | |
mul.wide.u32 %rd548, %r1939, 1792; | |
add.s64 %rd549, %rd135, %rd548; | |
mul.wide.u32 %rd550, %r1940, 28; | |
add.s64 %rd551, %rd549, %rd550; | |
ld.global.u32 %r1941, [%rd551]; | |
and.b32 %r1942, %r1941, 65535; | |
shl.b32 %r1943, %r1942, 6; | |
bfe.u32 %r1944, %r1941, 16, 6; | |
or.b32 %r336, %r1943, %r1944; | |
st.local.u32 [%rd1+224], %r336; | |
bfe.u32 %r1945, %r1938, 22, 6; | |
mul.wide.u32 %rd552, %r1945, 28; | |
add.s64 %rd553, %rd549, %rd552; | |
ld.global.u32 %r1946, [%rd553]; | |
and.b32 %r1947, %r1946, 65535; | |
shl.b32 %r1948, %r1947, 6; | |
bfe.u32 %r1949, %r1946, 16, 6; | |
or.b32 %r5008, %r1948, %r1949; | |
st.local.u32 [%rd1+228], %r5008; | |
setp.le.u32 %p54, %r336, %r5008; | |
mov.u32 %r5007, %r336; | |
@%p54 bra BB0_108; | |
st.local.u32 [%rd1+224], %r5008; | |
st.local.u32 [%rd1+228], %r336; | |
mov.u32 %r4765, %r5008; | |
mov.u32 %r5008, %r336; | |
mov.u32 %r5007, %r4765; | |
BB0_108: | |
mov.u32 %r5003, %r5007; | |
mov.u32 %r5004, %r5008; | |
bfe.u32 %r1950, %r335, 22, 6; | |
mul.lo.s64 %rd554, %rd29, 1792; | |
add.s64 %rd555, %rd136, %rd554; | |
mul.wide.u32 %rd556, %r1950, 28; | |
add.s64 %rd557, %rd555, %rd556; | |
ld.global.u32 %r1951, [%rd557]; | |
and.b32 %r1952, %r1951, 65535; | |
bfe.u32 %r1953, %r1951, 16, 6; | |
mul.wide.u32 %rd558, %r1952, 1792; | |
add.s64 %rd559, %rd135, %rd558; | |
mul.wide.u32 %rd560, %r1953, 28; | |
add.s64 %rd561, %rd559, %rd560; | |
ld.global.u32 %r1954, [%rd561]; | |
and.b32 %r1955, %r1954, 65535; | |
shl.b32 %r1956, %r1955, 6; | |
bfe.u32 %r1957, %r1954, 16, 6; | |
or.b32 %r340, %r1956, %r1957; | |
st.local.u32 [%rd1+232], %r340; | |
bfe.u32 %r1958, %r1951, 22, 6; | |
mul.wide.u32 %rd562, %r1958, 28; | |
add.s64 %rd563, %rd559, %rd562; | |
ld.global.u32 %r1959, [%rd563]; | |
and.b32 %r1960, %r1959, 65535; | |
shl.b32 %r1961, %r1960, 6; | |
bfe.u32 %r1962, %r1959, 16, 6; | |
or.b32 %r5010, %r1961, %r1962; | |
st.local.u32 [%rd1+236], %r5010; | |
setp.le.u32 %p55, %r340, %r5010; | |
mov.u32 %r5009, %r340; | |
@%p55 bra BB0_110; | |
st.local.u32 [%rd1+232], %r5010; | |
st.local.u32 [%rd1+236], %r340; | |
mov.u32 %r4771, %r5010; | |
mov.u32 %r5010, %r340; | |
mov.u32 %r5009, %r4771; | |
BB0_110: | |
mov.u32 %r343, %r5009; | |
mov.u32 %r342, %r5010; | |
setp.le.u32 %p56, %r5003, %r343; | |
mov.u32 %r5005, %r343; | |
mov.u32 %r5006, %r342; | |
@%p56 bra BB0_112; | |
st.local.u32 [%rd1+224], %r343; | |
st.local.u32 [%rd1+232], %r5003; | |
st.local.u32 [%rd1+228], %r342; | |
st.local.u32 [%rd1+236], %r5004; | |
mov.u32 %r4768, %r5004; | |
mov.u32 %r4770, %r5003; | |
mov.u32 %r5004, %r342; | |
mov.u32 %r5003, %r343; | |
mov.u32 %r5005, %r4770; | |
mov.u32 %r5006, %r4768; | |
BB0_112: | |
mov.u32 %r4995, %r5003; | |
mov.u32 %r4996, %r5004; | |
mov.u32 %r4997, %r5005; | |
mov.u32 %r4998, %r5006; | |
mul.lo.s64 %rd564, %rd28, 1792; | |
add.s64 %rd565, %rd3, %rd564; | |
bfe.u32 %r1963, %r334, 22, 6; | |
mul.wide.u32 %rd566, %r1963, 28; | |
add.s64 %rd567, %rd565, %rd566; | |
ld.global.u32 %r348, [%rd567+-8]; | |
and.b32 %r1964, %r348, 65535; | |
cvt.u64.u32 %rd30, %r1964; | |
bfe.u32 %r1965, %r348, 16, 6; | |
mul.wide.u32 %rd568, %r1964, 1792; | |
add.s64 %rd569, %rd136, %rd568; | |
mul.wide.u32 %rd570, %r1965, 28; | |
add.s64 %rd571, %rd569, %rd570; | |
ld.global.u32 %r1966, [%rd571]; | |
and.b32 %r1967, %r1966, 65535; | |
bfe.u32 %r1968, %r1966, 16, 6; | |
mul.wide.u32 %rd572, %r1967, 1792; | |
add.s64 %rd573, %rd135, %rd572; | |
mul.wide.u32 %rd574, %r1968, 28; | |
add.s64 %rd575, %rd573, %rd574; | |
ld.global.u32 %r1969, [%rd575]; | |
and.b32 %r1970, %r1969, 65535; | |
shl.b32 %r1971, %r1970, 6; | |
bfe.u32 %r1972, %r1969, 16, 6; | |
or.b32 %r349, %r1971, %r1972; | |
st.local.u32 [%rd1+240], %r349; | |
bfe.u32 %r1973, %r1966, 22, 6; | |
mul.wide.u32 %rd576, %r1973, 28; | |
add.s64 %rd577, %rd573, %rd576; | |
ld.global.u32 %r1974, [%rd577]; | |
and.b32 %r1975, %r1974, 65535; | |
shl.b32 %r1976, %r1975, 6; | |
bfe.u32 %r1977, %r1974, 16, 6; | |
or.b32 %r5016, %r1976, %r1977; | |
st.local.u32 [%rd1+244], %r5016; | |
setp.le.u32 %p57, %r349, %r5016; | |
mov.u32 %r5015, %r349; | |
@%p57 bra BB0_114; | |
st.local.u32 [%rd1+240], %r5016; | |
st.local.u32 [%rd1+244], %r349; | |
mov.u32 %r4785, %r5016; | |
mov.u32 %r5016, %r349; | |
mov.u32 %r5015, %r4785; | |
BB0_114: | |
mov.u32 %r5011, %r5015; | |
mov.u32 %r5012, %r5016; | |
bfe.u32 %r1978, %r348, 22, 6; | |
mul.lo.s64 %rd578, %rd30, 1792; | |
add.s64 %rd579, %rd136, %rd578; | |
mul.wide.u32 %rd580, %r1978, 28; | |
add.s64 %rd581, %rd579, %rd580; | |
ld.global.u32 %r1979, [%rd581]; | |
and.b32 %r1980, %r1979, 65535; | |
bfe.u32 %r1981, %r1979, 16, 6; | |
mul.wide.u32 %rd582, %r1980, 1792; | |
add.s64 %rd583, %rd135, %rd582; | |
mul.wide.u32 %rd584, %r1981, 28; | |
add.s64 %rd585, %rd583, %rd584; | |
ld.global.u32 %r1982, [%rd585]; | |
and.b32 %r1983, %r1982, 65535; | |
shl.b32 %r1984, %r1983, 6; | |
bfe.u32 %r1985, %r1982, 16, 6; | |
or.b32 %r353, %r1984, %r1985; | |
st.local.u32 [%rd1+248], %r353; | |
bfe.u32 %r1986, %r1979, 22, 6; | |
mul.wide.u32 %rd586, %r1986, 28; | |
add.s64 %rd587, %rd583, %rd586; | |
ld.global.u32 %r1987, [%rd587]; | |
and.b32 %r1988, %r1987, 65535; | |
shl.b32 %r1989, %r1988, 6; | |
bfe.u32 %r1990, %r1987, 16, 6; | |
or.b32 %r5018, %r1989, %r1990; | |
st.local.u32 [%rd1+252], %r5018; | |
setp.le.u32 %p58, %r353, %r5018; | |
mov.u32 %r5017, %r353; | |
@%p58 bra BB0_116; | |
st.local.u32 [%rd1+248], %r5018; | |
st.local.u32 [%rd1+252], %r353; | |
mov.u32 %r4791, %r5018; | |
mov.u32 %r5018, %r353; | |
mov.u32 %r5017, %r4791; | |
BB0_116: | |
mov.u32 %r356, %r5017; | |
mov.u32 %r355, %r5018; | |
setp.le.u32 %p59, %r5011, %r356; | |
mov.u32 %r5013, %r356; | |
mov.u32 %r5014, %r355; | |
@%p59 bra BB0_118; | |
st.local.u32 [%rd1+240], %r356; | |
st.local.u32 [%rd1+248], %r5011; | |
st.local.u32 [%rd1+244], %r355; | |
st.local.u32 [%rd1+252], %r5012; | |
mov.u32 %r4788, %r5012; | |
mov.u32 %r4790, %r5011; | |
mov.u32 %r5012, %r355; | |
mov.u32 %r5011, %r356; | |
mov.u32 %r5013, %r4790; | |
mov.u32 %r5014, %r4788; | |
BB0_118: | |
mov.u32 %r360, %r5011; | |
mov.u32 %r359, %r5012; | |
mov.u32 %r358, %r5013; | |
mov.u32 %r357, %r5014; | |
setp.le.u32 %p60, %r4995, %r360; | |
mov.u32 %r4999, %r360; | |
mov.u32 %r5000, %r359; | |
mov.u32 %r5001, %r358; | |
mov.u32 %r5002, %r357; | |
@%p60 bra BB0_120; | |
st.local.u32 [%rd1+224], %r360; | |
st.local.u32 [%rd1+240], %r4995; | |
st.local.u32 [%rd1+228], %r359; | |
st.local.u32 [%rd1+244], %r4996; | |
st.local.u32 [%rd1+232], %r358; | |
st.local.u32 [%rd1+248], %r4997; | |
st.local.u32 [%rd1+236], %r357; | |
st.local.u32 [%rd1+252], %r4998; | |
mov.u32 %r4778, %r4998; | |
mov.u32 %r4780, %r4997; | |
mov.u32 %r4782, %r4996; | |
mov.u32 %r4784, %r4995; | |
mov.u32 %r4998, %r357; | |
mov.u32 %r4997, %r358; | |
mov.u32 %r4996, %r359; | |
mov.u32 %r4995, %r360; | |
mov.u32 %r4999, %r4784; | |
mov.u32 %r5000, %r4782; | |
mov.u32 %r5001, %r4780; | |
mov.u32 %r5002, %r4778; | |
BB0_120: | |
mov.u32 %r368, %r4995; | |
mov.u32 %r367, %r4996; | |
mov.u32 %r366, %r4997; | |
mov.u32 %r365, %r4998; | |
mov.u32 %r364, %r4999; | |
mov.u32 %r363, %r5000; | |
mov.u32 %r362, %r5001; | |
mov.u32 %r361, %r5002; | |
setp.le.u32 %p61, %r4955, %r368; | |
mov.u32 %r4963, %r368; | |
mov.u32 %r4964, %r367; | |
mov.u32 %r4965, %r366; | |
mov.u32 %r4966, %r365; | |
mov.u32 %r4967, %r364; | |
mov.u32 %r4968, %r363; | |
mov.u32 %r4969, %r362; | |
mov.u32 %r4970, %r361; | |
@%p61 bra BB0_122; | |
st.local.u32 [%rd1+192], %r368; | |
st.local.u32 [%rd1+224], %r4955; | |
st.local.u32 [%rd1+196], %r367; | |
st.local.u32 [%rd1+228], %r4956; | |
st.local.u32 [%rd1+200], %r366; | |
st.local.u32 [%rd1+232], %r4957; | |
st.local.u32 [%rd1+204], %r365; | |
st.local.u32 [%rd1+236], %r4958; | |
st.local.u32 [%rd1+208], %r364; | |
st.local.u32 [%rd1+240], %r4959; | |
st.local.u32 [%rd1+212], %r363; | |
st.local.u32 [%rd1+244], %r4960; | |
st.local.u32 [%rd1+216], %r362; | |
st.local.u32 [%rd1+248], %r4961; | |
st.local.u32 [%rd1+220], %r361; | |
st.local.u32 [%rd1+252], %r4962; | |
mov.u32 %r4750, %r4962; | |
mov.u32 %r4752, %r4961; | |
mov.u32 %r4754, %r4960; | |
mov.u32 %r4756, %r4959; | |
mov.u32 %r4758, %r4958; | |
mov.u32 %r4760, %r4957; | |
mov.u32 %r4762, %r4956; | |
mov.u32 %r4764, %r4955; | |
mov.u32 %r4962, %r361; | |
mov.u32 %r4961, %r362; | |
mov.u32 %r4960, %r363; | |
mov.u32 %r4959, %r364; | |
mov.u32 %r4958, %r365; | |
mov.u32 %r4957, %r366; | |
mov.u32 %r4956, %r367; | |
mov.u32 %r4955, %r368; | |
mov.u32 %r4963, %r4764; | |
mov.u32 %r4964, %r4762; | |
mov.u32 %r4965, %r4760; | |
mov.u32 %r4966, %r4758; | |
mov.u32 %r4967, %r4756; | |
mov.u32 %r4968, %r4754; | |
mov.u32 %r4969, %r4752; | |
mov.u32 %r4970, %r4750; | |
BB0_122: | |
mov.u32 %r384, %r4955; | |
mov.u32 %r383, %r4956; | |
mov.u32 %r382, %r4957; | |
mov.u32 %r381, %r4958; | |
mov.u32 %r380, %r4959; | |
mov.u32 %r379, %r4960; | |
mov.u32 %r378, %r4961; | |
mov.u32 %r377, %r4962; | |
mov.u32 %r376, %r4963; | |
mov.u32 %r375, %r4964; | |
mov.u32 %r374, %r4965; | |
mov.u32 %r373, %r4966; | |
mov.u32 %r372, %r4967; | |
mov.u32 %r371, %r4968; | |
mov.u32 %r370, %r4969; | |
mov.u32 %r369, %r4970; | |
setp.le.u32 %p62, %r4859, %r384; | |
mov.u32 %r4875, %r384; | |
mov.u32 %r4876, %r383; | |
mov.u32 %r4877, %r382; | |
mov.u32 %r4878, %r381; | |
mov.u32 %r4879, %r380; | |
mov.u32 %r4880, %r379; | |
mov.u32 %r4881, %r378; | |
mov.u32 %r4882, %r377; | |
mov.u32 %r4883, %r376; | |
mov.u32 %r4884, %r375; | |
mov.u32 %r4885, %r374; | |
mov.u32 %r4886, %r373; | |
mov.u32 %r4887, %r372; | |
mov.u32 %r4888, %r371; | |
mov.u32 %r4889, %r370; | |
mov.u32 %r4890, %r369; | |
@%p62 bra BB0_124; | |
st.local.u32 [%rd1+128], %r384; | |
st.local.u32 [%rd1+192], %r4859; | |
st.local.u32 [%rd1+132], %r383; | |
st.local.u32 [%rd1+196], %r4860; | |
st.local.u32 [%rd1+136], %r382; | |
st.local.u32 [%rd1+200], %r4861; | |
st.local.u32 [%rd1+140], %r381; | |
st.local.u32 [%rd1+204], %r4862; | |
st.local.u32 [%rd1+144], %r380; | |
st.local.u32 [%rd1+208], %r4863; | |
st.local.u32 [%rd1+148], %r379; | |
st.local.u32 [%rd1+212], %r4864; | |
st.local.u32 [%rd1+152], %r378; | |
st.local.u32 [%rd1+216], %r4865; | |
st.local.u32 [%rd1+156], %r377; | |
st.local.u32 [%rd1+220], %r4866; | |
st.local.u32 [%rd1+160], %r376; | |
st.local.u32 [%rd1+224], %r4867; | |
st.local.u32 [%rd1+164], %r375; | |
st.local.u32 [%rd1+228], %r4868; | |
st.local.u32 [%rd1+168], %r374; | |
st.local.u32 [%rd1+232], %r4869; | |
st.local.u32 [%rd1+172], %r373; | |
st.local.u32 [%rd1+236], %r4870; | |
st.local.u32 [%rd1+176], %r372; | |
st.local.u32 [%rd1+240], %r4871; | |
st.local.u32 [%rd1+180], %r371; | |
st.local.u32 [%rd1+244], %r4872; | |
st.local.u32 [%rd1+184], %r370; | |
st.local.u32 [%rd1+248], %r4873; | |
st.local.u32 [%rd1+188], %r369; | |
st.local.u32 [%rd1+252], %r4874; | |
mov.u32 %r4678, %r4874; | |
mov.u32 %r4680, %r4873; | |
mov.u32 %r4682, %r4872; | |
mov.u32 %r4684, %r4871; | |
mov.u32 %r4686, %r4870; | |
mov.u32 %r4688, %r4869; | |
mov.u32 %r4690, %r4868; | |
mov.u32 %r4692, %r4867; | |
mov.u32 %r4694, %r4866; | |
mov.u32 %r4696, %r4865; | |
mov.u32 %r4698, %r4864; | |
mov.u32 %r4700, %r4863; | |
mov.u32 %r4702, %r4862; | |
mov.u32 %r4704, %r4861; | |
mov.u32 %r4706, %r4860; | |
mov.u32 %r4708, %r4859; | |
mov.u32 %r4874, %r369; | |
mov.u32 %r4873, %r370; | |
mov.u32 %r4872, %r371; | |
mov.u32 %r4871, %r372; | |
mov.u32 %r4870, %r373; | |
mov.u32 %r4869, %r374; | |
mov.u32 %r4868, %r375; | |
mov.u32 %r4867, %r376; | |
mov.u32 %r4866, %r377; | |
mov.u32 %r4865, %r378; | |
mov.u32 %r4864, %r379; | |
mov.u32 %r4863, %r380; | |
mov.u32 %r4862, %r381; | |
mov.u32 %r4861, %r382; | |
mov.u32 %r4860, %r383; | |
mov.u32 %r4859, %r384; | |
mov.u32 %r4875, %r4708; | |
mov.u32 %r4876, %r4706; | |
mov.u32 %r4877, %r4704; | |
mov.u32 %r4878, %r4702; | |
mov.u32 %r4879, %r4700; | |
mov.u32 %r4880, %r4698; | |
mov.u32 %r4881, %r4696; | |
mov.u32 %r4882, %r4694; | |
mov.u32 %r4883, %r4692; | |
mov.u32 %r4884, %r4690; | |
mov.u32 %r4885, %r4688; | |
mov.u32 %r4886, %r4686; | |
mov.u32 %r4887, %r4684; | |
mov.u32 %r4888, %r4682; | |
mov.u32 %r4889, %r4680; | |
mov.u32 %r4890, %r4678; | |
BB0_124: | |
mov.u32 %r416, %r4859; | |
setp.le.u32 %p63, %r209, %r416; | |
mov.u32 %r4858, %r209; | |
@%p63 bra BB0_126; | |
st.local.u32 [%rd1], %r416; | |
st.local.u32 [%rd1+128], %r209; | |
st.local.u32 [%rd1+4], %r4860; | |
st.local.u32 [%rd1+132], %r5020; | |
st.local.u32 [%rd1+8], %r4861; | |
st.local.u32 [%rd1+136], %r5021; | |
st.local.u32 [%rd1+12], %r4862; | |
st.local.u32 [%rd1+140], %r5022; | |
st.local.u32 [%rd1+16], %r4863; | |
st.local.u32 [%rd1+144], %r5023; | |
st.local.u32 [%rd1+20], %r4864; | |
st.local.u32 [%rd1+148], %r5024; | |
st.local.u32 [%rd1+24], %r4865; | |
st.local.u32 [%rd1+152], %r5025; | |
st.local.u32 [%rd1+28], %r4866; | |
st.local.u32 [%rd1+156], %r5026; | |
st.local.u32 [%rd1+32], %r4867; | |
st.local.u32 [%rd1+160], %r5027; | |
st.local.u32 [%rd1+36], %r4868; | |
st.local.u32 [%rd1+164], %r5028; | |
st.local.u32 [%rd1+40], %r4869; | |
st.local.u32 [%rd1+168], %r5029; | |
st.local.u32 [%rd1+44], %r4870; | |
st.local.u32 [%rd1+172], %r5030; | |
st.local.u32 [%rd1+48], %r4871; | |
st.local.u32 [%rd1+176], %r5031; | |
st.local.u32 [%rd1+52], %r4872; | |
st.local.u32 [%rd1+180], %r5032; | |
st.local.u32 [%rd1+56], %r4873; | |
st.local.u32 [%rd1+184], %r5033; | |
st.local.u32 [%rd1+60], %r4874; | |
st.local.u32 [%rd1+188], %r5034; | |
st.local.u32 [%rd1+64], %r4875; | |
st.local.u32 [%rd1+192], %r5035; | |
st.local.u32 [%rd1+68], %r4876; | |
st.local.u32 [%rd1+196], %r5036; | |
st.local.u32 [%rd1+72], %r4877; | |
st.local.u32 [%rd1+200], %r5037; | |
st.local.u32 [%rd1+76], %r4878; | |
st.local.u32 [%rd1+204], %r5038; | |
st.local.u32 [%rd1+80], %r4879; | |
st.local.u32 [%rd1+208], %r5039; | |
st.local.u32 [%rd1+84], %r4880; | |
st.local.u32 [%rd1+212], %r5040; | |
st.local.u32 [%rd1+88], %r4881; | |
st.local.u32 [%rd1+216], %r5041; | |
st.local.u32 [%rd1+92], %r4882; | |
st.local.u32 [%rd1+220], %r5042; | |
st.local.u32 [%rd1+96], %r4883; | |
st.local.u32 [%rd1+224], %r5043; | |
st.local.u32 [%rd1+100], %r4884; | |
st.local.u32 [%rd1+228], %r5044; | |
st.local.u32 [%rd1+104], %r4885; | |
st.local.u32 [%rd1+232], %r5045; | |
st.local.u32 [%rd1+108], %r4886; | |
st.local.u32 [%rd1+236], %r5046; | |
st.local.u32 [%rd1+112], %r4887; | |
st.local.u32 [%rd1+240], %r5047; | |
st.local.u32 [%rd1+116], %r4888; | |
st.local.u32 [%rd1+244], %r5048; | |
st.local.u32 [%rd1+120], %r4889; | |
st.local.u32 [%rd1+248], %r5049; | |
st.local.u32 [%rd1+124], %r4890; | |
st.local.u32 [%rd1+252], %r5050; | |
mov.u32 %r4858, %r416; | |
BB0_126: | |
mov.u32 %r4857, %r4858; | |
bfe.u32 %r1991, %r1, 22, 6; | |
mul.wide.u32 %rd591, %r1991, 28; | |
add.s64 %rd592, %rd143, %rd591; | |
ld.global.u32 %r418, [%rd592]; | |
and.b32 %r1993, %r418, 65535; | |
mul.wide.u32 %rd593, %r1993, 1792; | |
add.s64 %rd594, %rd146, %rd593; | |
bfe.u32 %r1994, %r418, 16, 6; | |
mul.wide.u32 %rd595, %r1994, 28; | |
add.s64 %rd596, %rd594, %rd595; | |
ld.global.u32 %r419, [%rd596+4]; | |
and.b32 %r1995, %r419, 65535; | |
mul.wide.u32 %rd597, %r1995, 1792; | |
add.s64 %rd598, %rd3, %rd597; | |
bfe.u32 %r1996, %r419, 16, 6; | |
mul.wide.u32 %rd599, %r1996, 28; | |
add.s64 %rd600, %rd598, %rd599; | |
ld.global.u32 %r420, [%rd600+-4]; | |
and.b32 %r1997, %r420, 65535; | |
bfe.u32 %r1998, %r420, 16, 6; | |
mul.wide.u32 %rd601, %r1997, 1792; | |
add.s64 %rd602, %rd146, %rd601; | |
mul.wide.u32 %rd603, %r1998, 28; | |
add.s64 %rd604, %rd602, %rd603; | |
ld.global.u32 %r421, [%rd604]; | |
and.b32 %r1999, %r421, 65535; | |
mul.wide.u32 %rd605, %r1999, 1792; | |
add.s64 %rd606, %rd3, %rd605; | |
cvt.u64.u32 %rd31, %r1993; | |
cvt.u64.u32 %rd32, %r1995; | |
cvt.u64.u32 %rd33, %r1997; | |
cvt.u64.u32 %rd34, %r1999; | |
bfe.u32 %r2000, %r421, 16, 6; | |
mul.wide.u32 %rd607, %r2000, 28; | |
add.s64 %rd608, %rd606, %rd607; | |
ld.global.u32 %r422, [%rd608+-8]; | |
and.b32 %r2001, %r422, 65535; | |
cvt.u64.u32 %rd35, %r2001; | |
bfe.u32 %r2002, %r422, 16, 6; | |
mul.wide.u32 %rd609, %r2001, 1792; | |
add.s64 %rd610, %rd136, %rd609; | |
mul.wide.u32 %rd611, %r2002, 28; | |
add.s64 %rd612, %rd610, %rd611; | |
ld.global.u32 %r2003, [%rd612]; | |
and.b32 %r2004, %r2003, 65535; | |
bfe.u32 %r2005, %r2003, 16, 6; | |
mul.wide.u32 %rd613, %r2004, 1792; | |
add.s64 %rd614, %rd135, %rd613; | |
mul.wide.u32 %rd615, %r2005, 28; | |
add.s64 %rd616, %rd614, %rd615; | |
ld.global.u32 %r2006, [%rd616]; | |
and.b32 %r2007, %r2006, 65535; | |
shl.b32 %r2008, %r2007, 6; | |
bfe.u32 %r2009, %r2006, 16, 6; | |
or.b32 %r423, %r2008, %r2009; | |
st.local.u32 [%rd1+256], %r423; | |
bfe.u32 %r2010, %r2003, 22, 6; | |
mul.wide.u32 %rd617, %r2010, 28; | |
add.s64 %rd618, %rd614, %rd617; | |
ld.global.u32 %r2011, [%rd618]; | |
and.b32 %r2012, %r2011, 65535; | |
shl.b32 %r2013, %r2012, 6; | |
bfe.u32 %r2014, %r2011, 16, 6; | |
or.b32 %r4241, %r2013, %r2014; | |
st.local.u32 [%rd1+260], %r4241; | |
setp.le.u32 %p64, %r423, %r4241; | |
mov.u32 %r4240, %r423; | |
@%p64 bra BB0_128; | |
st.local.u32 [%rd1+256], %r4241; | |
st.local.u32 [%rd1+260], %r423; | |
mov.u32 %r3919, %r4241; | |
mov.u32 %r4241, %r423; | |
mov.u32 %r4240, %r3919; | |
BB0_128: | |
mov.u32 %r4236, %r4240; | |
mov.u32 %r4237, %r4241; | |
bfe.u32 %r2015, %r422, 22, 6; | |
mul.lo.s64 %rd619, %rd35, 1792; | |
add.s64 %rd620, %rd136, %rd619; | |
mul.wide.u32 %rd621, %r2015, 28; | |
add.s64 %rd622, %rd620, %rd621; | |
ld.global.u32 %r2016, [%rd622]; | |
and.b32 %r2017, %r2016, 65535; | |
bfe.u32 %r2018, %r2016, 16, 6; | |
mul.wide.u32 %rd623, %r2017, 1792; | |
add.s64 %rd624, %rd135, %rd623; | |
mul.wide.u32 %rd625, %r2018, 28; | |
add.s64 %rd626, %rd624, %rd625; | |
ld.global.u32 %r2019, [%rd626]; | |
and.b32 %r2020, %r2019, 65535; | |
shl.b32 %r2021, %r2020, 6; | |
bfe.u32 %r2022, %r2019, 16, 6; | |
or.b32 %r427, %r2021, %r2022; | |
st.local.u32 [%rd1+264], %r427; | |
bfe.u32 %r2023, %r2016, 22, 6; | |
mul.wide.u32 %rd627, %r2023, 28; | |
add.s64 %rd628, %rd624, %rd627; | |
ld.global.u32 %r2024, [%rd628]; | |
and.b32 %r2025, %r2024, 65535; | |
shl.b32 %r2026, %r2025, 6; | |
bfe.u32 %r2027, %r2024, 16, 6; | |
or.b32 %r4243, %r2026, %r2027; | |
st.local.u32 [%rd1+268], %r4243; | |
setp.le.u32 %p65, %r427, %r4243; | |
mov.u32 %r4242, %r427; | |
@%p65 bra BB0_130; | |
st.local.u32 [%rd1+264], %r4243; | |
st.local.u32 [%rd1+268], %r427; | |
mov.u32 %r3925, %r4243; | |
mov.u32 %r4243, %r427; | |
mov.u32 %r4242, %r3925; | |
BB0_130: | |
mov.u32 %r430, %r4242; | |
mov.u32 %r429, %r4243; | |
setp.le.u32 %p66, %r4236, %r430; | |
mov.u32 %r4238, %r430; | |
mov.u32 %r4239, %r429; | |
@%p66 bra BB0_132; | |
st.local.u32 [%rd1+256], %r430; | |
st.local.u32 [%rd1+264], %r4236; | |
st.local.u32 [%rd1+260], %r429; | |
st.local.u32 [%rd1+268], %r4237; | |
mov.u32 %r3922, %r4237; | |
mov.u32 %r3924, %r4236; | |
mov.u32 %r4237, %r429; | |
mov.u32 %r4236, %r430; | |
mov.u32 %r4238, %r3924; | |
mov.u32 %r4239, %r3922; | |
BB0_132: | |
mov.u32 %r4228, %r4236; | |
mov.u32 %r4229, %r4237; | |
mov.u32 %r4230, %r4238; | |
mov.u32 %r4231, %r4239; | |
mul.lo.s64 %rd629, %rd34, 1792; | |
add.s64 %rd630, %rd3, %rd629; | |
bfe.u32 %r2028, %r421, 22, 6; | |
mul.wide.u32 %rd631, %r2028, 28; | |
add.s64 %rd632, %rd630, %rd631; | |
ld.global.u32 %r435, [%rd632+-8]; | |
and.b32 %r2029, %r435, 65535; | |
cvt.u64.u32 %rd36, %r2029; | |
bfe.u32 %r2030, %r435, 16, 6; | |
mul.wide.u32 %rd633, %r2029, 1792; | |
add.s64 %rd634, %rd136, %rd633; | |
mul.wide.u32 %rd635, %r2030, 28; | |
add.s64 %rd636, %rd634, %rd635; | |
ld.global.u32 %r2031, [%rd636]; | |
and.b32 %r2032, %r2031, 65535; | |
bfe.u32 %r2033, %r2031, 16, 6; | |
mul.wide.u32 %rd637, %r2032, 1792; | |
add.s64 %rd638, %rd135, %rd637; | |
mul.wide.u32 %rd639, %r2033, 28; | |
add.s64 %rd640, %rd638, %rd639; | |
ld.global.u32 %r2034, [%rd640]; | |
and.b32 %r2035, %r2034, 65535; | |
shl.b32 %r2036, %r2035, 6; | |
bfe.u32 %r2037, %r2034, 16, 6; | |
or.b32 %r436, %r2036, %r2037; | |
st.local.u32 [%rd1+272], %r436; | |
bfe.u32 %r2038, %r2031, 22, 6; | |
mul.wide.u32 %rd641, %r2038, 28; | |
add.s64 %rd642, %rd638, %rd641; | |
ld.global.u32 %r2039, [%rd642]; | |
and.b32 %r2040, %r2039, 65535; | |
shl.b32 %r2041, %r2040, 6; | |
bfe.u32 %r2042, %r2039, 16, 6; | |
or.b32 %r4249, %r2041, %r2042; | |
st.local.u32 [%rd1+276], %r4249; | |
setp.le.u32 %p67, %r436, %r4249; | |
mov.u32 %r4248, %r436; | |
@%p67 bra BB0_134; | |
st.local.u32 [%rd1+272], %r4249; | |
st.local.u32 [%rd1+276], %r436; | |
mov.u32 %r3939, %r4249; | |
mov.u32 %r4249, %r436; | |
mov.u32 %r4248, %r3939; | |
BB0_134: | |
mov.u32 %r4244, %r4248; | |
mov.u32 %r4245, %r4249; | |
bfe.u32 %r2043, %r435, 22, 6; | |
mul.lo.s64 %rd643, %rd36, 1792; | |
add.s64 %rd644, %rd136, %rd643; | |
mul.wide.u32 %rd645, %r2043, 28; | |
add.s64 %rd646, %rd644, %rd645; | |
ld.global.u32 %r2044, [%rd646]; | |
and.b32 %r2045, %r2044, 65535; | |
bfe.u32 %r2046, %r2044, 16, 6; | |
mul.wide.u32 %rd647, %r2045, 1792; | |
add.s64 %rd648, %rd135, %rd647; | |
mul.wide.u32 %rd649, %r2046, 28; | |
add.s64 %rd650, %rd648, %rd649; | |
ld.global.u32 %r2047, [%rd650]; | |
and.b32 %r2048, %r2047, 65535; | |
shl.b32 %r2049, %r2048, 6; | |
bfe.u32 %r2050, %r2047, 16, 6; | |
or.b32 %r440, %r2049, %r2050; | |
st.local.u32 [%rd1+280], %r440; | |
bfe.u32 %r2051, %r2044, 22, 6; | |
mul.wide.u32 %rd651, %r2051, 28; | |
add.s64 %rd652, %rd648, %rd651; | |
ld.global.u32 %r2052, [%rd652]; | |
and.b32 %r2053, %r2052, 65535; | |
shl.b32 %r2054, %r2053, 6; | |
bfe.u32 %r2055, %r2052, 16, 6; | |
or.b32 %r4251, %r2054, %r2055; | |
st.local.u32 [%rd1+284], %r4251; | |
setp.le.u32 %p68, %r440, %r4251; | |
mov.u32 %r4250, %r440; | |
@%p68 bra BB0_136; | |
st.local.u32 [%rd1+280], %r4251; | |
st.local.u32 [%rd1+284], %r440; | |
mov.u32 %r3945, %r4251; | |
mov.u32 %r4251, %r440; | |
mov.u32 %r4250, %r3945; | |
BB0_136: | |
mov.u32 %r443, %r4250; | |
mov.u32 %r442, %r4251; | |
setp.le.u32 %p69, %r4244, %r443; | |
mov.u32 %r4246, %r443; | |
mov.u32 %r4247, %r442; | |
@%p69 bra BB0_138; | |
st.local.u32 [%rd1+272], %r443; | |
st.local.u32 [%rd1+280], %r4244; | |
st.local.u32 [%rd1+276], %r442; | |
st.local.u32 [%rd1+284], %r4245; | |
mov.u32 %r3942, %r4245; | |
mov.u32 %r3944, %r4244; | |
mov.u32 %r4245, %r442; | |
mov.u32 %r4244, %r443; | |
mov.u32 %r4246, %r3944; | |
mov.u32 %r4247, %r3942; | |
BB0_138: | |
mov.u32 %r447, %r4244; | |
mov.u32 %r446, %r4245; | |
mov.u32 %r445, %r4246; | |
mov.u32 %r444, %r4247; | |
setp.le.u32 %p70, %r4228, %r447; | |
mov.u32 %r4232, %r447; | |
mov.u32 %r4233, %r446; | |
mov.u32 %r4234, %r445; | |
mov.u32 %r4235, %r444; | |
@%p70 bra BB0_140; | |
st.local.u32 [%rd1+256], %r447; | |
st.local.u32 [%rd1+272], %r4228; | |
st.local.u32 [%rd1+260], %r446; | |
st.local.u32 [%rd1+276], %r4229; | |
st.local.u32 [%rd1+264], %r445; | |
st.local.u32 [%rd1+280], %r4230; | |
st.local.u32 [%rd1+268], %r444; | |
st.local.u32 [%rd1+284], %r4231; | |
mov.u32 %r3932, %r4231; | |
mov.u32 %r3934, %r4230; | |
mov.u32 %r3936, %r4229; | |
mov.u32 %r3938, %r4228; | |
mov.u32 %r4231, %r444; | |
mov.u32 %r4230, %r445; | |
mov.u32 %r4229, %r446; | |
mov.u32 %r4228, %r447; | |
mov.u32 %r4232, %r3938; | |
mov.u32 %r4233, %r3936; | |
mov.u32 %r4234, %r3934; | |
mov.u32 %r4235, %r3932; | |
BB0_140: | |
mov.u32 %r4212, %r4228; | |
mov.u32 %r4213, %r4229; | |
mov.u32 %r4214, %r4230; | |
mov.u32 %r4215, %r4231; | |
mov.u32 %r4216, %r4232; | |
mov.u32 %r4217, %r4233; | |
mov.u32 %r4218, %r4234; | |
mov.u32 %r4219, %r4235; | |
mul.lo.s64 %rd653, %rd33, 1792; | |
add.s64 %rd654, %rd136, %rd653; | |
bfe.u32 %r2056, %r420, 22, 6; | |
mul.wide.u32 %rd655, %r2056, 28; | |
add.s64 %rd656, %rd654, %rd655; | |
ld.global.u32 %r456, [%rd656+4]; | |
and.b32 %r2057, %r456, 65535; | |
mul.wide.u32 %rd657, %r2057, 1792; | |
add.s64 %rd658, %rd3, %rd657; | |
cvt.u64.u32 %rd37, %r2057; | |
bfe.u32 %r2058, %r456, 16, 6; | |
mul.wide.u32 %rd659, %r2058, 28; | |
add.s64 %rd660, %rd658, %rd659; | |
ld.global.u32 %r457, [%rd660+-8]; | |
and.b32 %r2059, %r457, 65535; | |
cvt.u64.u32 %rd38, %r2059; | |
bfe.u32 %r2060, %r457, 16, 6; | |
mul.wide.u32 %rd661, %r2059, 1792; | |
add.s64 %rd662, %rd136, %rd661; | |
mul.wide.u32 %rd663, %r2060, 28; | |
add.s64 %rd664, %rd662, %rd663; | |
ld.global.u32 %r2061, [%rd664]; | |
and.b32 %r2062, %r2061, 65535; | |
bfe.u32 %r2063, %r2061, 16, 6; | |
mul.wide.u32 %rd665, %r2062, 1792; | |
add.s64 %rd666, %rd135, %rd665; | |
mul.wide.u32 %rd667, %r2063, 28; | |
add.s64 %rd668, %rd666, %rd667; | |
ld.global.u32 %r2064, [%rd668]; | |
and.b32 %r2065, %r2064, 65535; | |
shl.b32 %r2066, %r2065, 6; | |
bfe.u32 %r2067, %r2064, 16, 6; | |
or.b32 %r458, %r2066, %r2067; | |
st.local.u32 [%rd1+288], %r458; | |
bfe.u32 %r2068, %r2061, 22, 6; | |
mul.wide.u32 %rd669, %r2068, 28; | |
add.s64 %rd670, %rd666, %rd669; | |
ld.global.u32 %r2069, [%rd670]; | |
and.b32 %r2070, %r2069, 65535; | |
shl.b32 %r2071, %r2070, 6; | |
bfe.u32 %r2072, %r2069, 16, 6; | |
or.b32 %r4265, %r2071, %r2072; | |
st.local.u32 [%rd1+292], %r4265; | |
setp.le.u32 %p71, %r458, %r4265; | |
mov.u32 %r4264, %r458; | |
@%p71 bra BB0_142; | |
st.local.u32 [%rd1+288], %r4265; | |
st.local.u32 [%rd1+292], %r458; | |
mov.u32 %r3975, %r4265; | |
mov.u32 %r4265, %r458; | |
mov.u32 %r4264, %r3975; | |
BB0_142: | |
mov.u32 %r4260, %r4264; | |
mov.u32 %r4261, %r4265; | |
bfe.u32 %r2073, %r457, 22, 6; | |
mul.lo.s64 %rd671, %rd38, 1792; | |
add.s64 %rd672, %rd136, %rd671; | |
mul.wide.u32 %rd673, %r2073, 28; | |
add.s64 %rd674, %rd672, %rd673; | |
ld.global.u32 %r2074, [%rd674]; | |
and.b32 %r2075, %r2074, 65535; | |
bfe.u32 %r2076, %r2074, 16, 6; | |
mul.wide.u32 %rd675, %r2075, 1792; | |
add.s64 %rd676, %rd135, %rd675; | |
mul.wide.u32 %rd677, %r2076, 28; | |
add.s64 %rd678, %rd676, %rd677; | |
ld.global.u32 %r2077, [%rd678]; | |
and.b32 %r2078, %r2077, 65535; | |
shl.b32 %r2079, %r2078, 6; | |
bfe.u32 %r2080, %r2077, 16, 6; | |
or.b32 %r462, %r2079, %r2080; | |
st.local.u32 [%rd1+296], %r462; | |
bfe.u32 %r2081, %r2074, 22, 6; | |
mul.wide.u32 %rd679, %r2081, 28; | |
add.s64 %rd680, %rd676, %rd679; | |
ld.global.u32 %r2082, [%rd680]; | |
and.b32 %r2083, %r2082, 65535; | |
shl.b32 %r2084, %r2083, 6; | |
bfe.u32 %r2085, %r2082, 16, 6; | |
or.b32 %r4267, %r2084, %r2085; | |
st.local.u32 [%rd1+300], %r4267; | |
setp.le.u32 %p72, %r462, %r4267; | |
mov.u32 %r4266, %r462; | |
@%p72 bra BB0_144; | |
st.local.u32 [%rd1+296], %r4267; | |
st.local.u32 [%rd1+300], %r462; | |
mov.u32 %r3981, %r4267; | |
mov.u32 %r4267, %r462; | |
mov.u32 %r4266, %r3981; | |
BB0_144: | |
mov.u32 %r465, %r4266; | |
mov.u32 %r464, %r4267; | |
setp.le.u32 %p73, %r4260, %r465; | |
mov.u32 %r4262, %r465; | |
mov.u32 %r4263, %r464; | |
@%p73 bra BB0_146; | |
st.local.u32 [%rd1+288], %r465; | |
st.local.u32 [%rd1+296], %r4260; | |
st.local.u32 [%rd1+292], %r464; | |
st.local.u32 [%rd1+300], %r4261; | |
mov.u32 %r3978, %r4261; | |
mov.u32 %r3980, %r4260; | |
mov.u32 %r4261, %r464; | |
mov.u32 %r4260, %r465; | |
mov.u32 %r4262, %r3980; | |
mov.u32 %r4263, %r3978; | |
BB0_146: | |
mov.u32 %r4252, %r4260; | |
mov.u32 %r4253, %r4261; | |
mov.u32 %r4254, %r4262; | |
mov.u32 %r4255, %r4263; | |
mul.lo.s64 %rd681, %rd37, 1792; | |
add.s64 %rd682, %rd3, %rd681; | |
bfe.u32 %r2086, %r456, 22, 6; | |
mul.wide.u32 %rd683, %r2086, 28; | |
add.s64 %rd684, %rd682, %rd683; | |
ld.global.u32 %r470, [%rd684+-8]; | |
and.b32 %r2087, %r470, 65535; | |
cvt.u64.u32 %rd39, %r2087; | |
bfe.u32 %r2088, %r470, 16, 6; | |
mul.wide.u32 %rd685, %r2087, 1792; | |
add.s64 %rd686, %rd136, %rd685; | |
mul.wide.u32 %rd687, %r2088, 28; | |
add.s64 %rd688, %rd686, %rd687; | |
ld.global.u32 %r2089, [%rd688]; | |
and.b32 %r2090, %r2089, 65535; | |
bfe.u32 %r2091, %r2089, 16, 6; | |
mul.wide.u32 %rd689, %r2090, 1792; | |
add.s64 %rd690, %rd135, %rd689; | |
mul.wide.u32 %rd691, %r2091, 28; | |
add.s64 %rd692, %rd690, %rd691; | |
ld.global.u32 %r2092, [%rd692]; | |
and.b32 %r2093, %r2092, 65535; | |
shl.b32 %r2094, %r2093, 6; | |
bfe.u32 %r2095, %r2092, 16, 6; | |
or.b32 %r471, %r2094, %r2095; | |
st.local.u32 [%rd1+304], %r471; | |
bfe.u32 %r2096, %r2089, 22, 6; | |
mul.wide.u32 %rd693, %r2096, 28; | |
add.s64 %rd694, %rd690, %rd693; | |
ld.global.u32 %r2097, [%rd694]; | |
and.b32 %r2098, %r2097, 65535; | |
shl.b32 %r2099, %r2098, 6; | |
bfe.u32 %r2100, %r2097, 16, 6; | |
or.b32 %r4273, %r2099, %r2100; | |
st.local.u32 [%rd1+308], %r4273; | |
setp.le.u32 %p74, %r471, %r4273; | |
mov.u32 %r4272, %r471; | |
@%p74 bra BB0_148; | |
st.local.u32 [%rd1+304], %r4273; | |
st.local.u32 [%rd1+308], %r471; | |
mov.u32 %r3995, %r4273; | |
mov.u32 %r4273, %r471; | |
mov.u32 %r4272, %r3995; | |
BB0_148: | |
mov.u32 %r4268, %r4272; | |
mov.u32 %r4269, %r4273; | |
bfe.u32 %r2101, %r470, 22, 6; | |
mul.lo.s64 %rd695, %rd39, 1792; | |
add.s64 %rd696, %rd136, %rd695; | |
mul.wide.u32 %rd697, %r2101, 28; | |
add.s64 %rd698, %rd696, %rd697; | |
ld.global.u32 %r2102, [%rd698]; | |
and.b32 %r2103, %r2102, 65535; | |
bfe.u32 %r2104, %r2102, 16, 6; | |
mul.wide.u32 %rd699, %r2103, 1792; | |
add.s64 %rd700, %rd135, %rd699; | |
mul.wide.u32 %rd701, %r2104, 28; | |
add.s64 %rd702, %rd700, %rd701; | |
ld.global.u32 %r2105, [%rd702]; | |
and.b32 %r2106, %r2105, 65535; | |
shl.b32 %r2107, %r2106, 6; | |
bfe.u32 %r2108, %r2105, 16, 6; | |
or.b32 %r475, %r2107, %r2108; | |
st.local.u32 [%rd1+312], %r475; | |
bfe.u32 %r2109, %r2102, 22, 6; | |
mul.wide.u32 %rd703, %r2109, 28; | |
add.s64 %rd704, %rd700, %rd703; | |
ld.global.u32 %r2110, [%rd704]; | |
and.b32 %r2111, %r2110, 65535; | |
shl.b32 %r2112, %r2111, 6; | |
bfe.u32 %r2113, %r2110, 16, 6; | |
or.b32 %r4275, %r2112, %r2113; | |
st.local.u32 [%rd1+316], %r4275; | |
setp.le.u32 %p75, %r475, %r4275; | |
mov.u32 %r4274, %r475; | |
@%p75 bra BB0_150; | |
st.local.u32 [%rd1+312], %r4275; | |
st.local.u32 [%rd1+316], %r475; | |
mov.u32 %r4001, %r4275; | |
mov.u32 %r4275, %r475; | |
mov.u32 %r4274, %r4001; | |
BB0_150: | |
mov.u32 %r478, %r4274; | |
mov.u32 %r477, %r4275; | |
setp.le.u32 %p76, %r4268, %r478; | |
mov.u32 %r4270, %r478; | |
mov.u32 %r4271, %r477; | |
@%p76 bra BB0_152; | |
st.local.u32 [%rd1+304], %r478; | |
st.local.u32 [%rd1+312], %r4268; | |
st.local.u32 [%rd1+308], %r477; | |
st.local.u32 [%rd1+316], %r4269; | |
mov.u32 %r3998, %r4269; | |
mov.u32 %r4000, %r4268; | |
mov.u32 %r4269, %r477; | |
mov.u32 %r4268, %r478; | |
mov.u32 %r4270, %r4000; | |
mov.u32 %r4271, %r3998; | |
BB0_152: | |
mov.u32 %r482, %r4268; | |
mov.u32 %r481, %r4269; | |
mov.u32 %r480, %r4270; | |
mov.u32 %r479, %r4271; | |
setp.le.u32 %p77, %r4252, %r482; | |
mov.u32 %r4256, %r482; | |
mov.u32 %r4257, %r481; | |
mov.u32 %r4258, %r480; | |
mov.u32 %r4259, %r479; | |
@%p77 bra BB0_154; | |
st.local.u32 [%rd1+288], %r482; | |
st.local.u32 [%rd1+304], %r4252; | |
st.local.u32 [%rd1+292], %r481; | |
st.local.u32 [%rd1+308], %r4253; | |
st.local.u32 [%rd1+296], %r480; | |
st.local.u32 [%rd1+312], %r4254; | |
st.local.u32 [%rd1+300], %r479; | |
st.local.u32 [%rd1+316], %r4255; | |
mov.u32 %r3988, %r4255; | |
mov.u32 %r3990, %r4254; | |
mov.u32 %r3992, %r4253; | |
mov.u32 %r3994, %r4252; | |
mov.u32 %r4255, %r479; | |
mov.u32 %r4254, %r480; | |
mov.u32 %r4253, %r481; | |
mov.u32 %r4252, %r482; | |
mov.u32 %r4256, %r3994; | |
mov.u32 %r4257, %r3992; | |
mov.u32 %r4258, %r3990; | |
mov.u32 %r4259, %r3988; | |
BB0_154: | |
mov.u32 %r490, %r4252; | |
mov.u32 %r489, %r4253; | |
mov.u32 %r488, %r4254; | |
mov.u32 %r487, %r4255; | |
mov.u32 %r486, %r4256; | |
mov.u32 %r485, %r4257; | |
mov.u32 %r484, %r4258; | |
mov.u32 %r483, %r4259; | |
setp.le.u32 %p78, %r4212, %r490; | |
mov.u32 %r4220, %r490; | |
mov.u32 %r4221, %r489; | |
mov.u32 %r4222, %r488; | |
mov.u32 %r4223, %r487; | |
mov.u32 %r4224, %r486; | |
mov.u32 %r4225, %r485; | |
mov.u32 %r4226, %r484; | |
mov.u32 %r4227, %r483; | |
@%p78 bra BB0_156; | |
st.local.u32 [%rd1+256], %r490; | |
st.local.u32 [%rd1+288], %r4212; | |
st.local.u32 [%rd1+260], %r489; | |
st.local.u32 [%rd1+292], %r4213; | |
st.local.u32 [%rd1+264], %r488; | |
st.local.u32 [%rd1+296], %r4214; | |
st.local.u32 [%rd1+268], %r487; | |
st.local.u32 [%rd1+300], %r4215; | |
st.local.u32 [%rd1+272], %r486; | |
st.local.u32 [%rd1+304], %r4216; | |
st.local.u32 [%rd1+276], %r485; | |
st.local.u32 [%rd1+308], %r4217; | |
st.local.u32 [%rd1+280], %r484; | |
st.local.u32 [%rd1+312], %r4218; | |
st.local.u32 [%rd1+284], %r483; | |
st.local.u32 [%rd1+316], %r4219; | |
mov.u32 %r3960, %r4219; | |
mov.u32 %r3962, %r4218; | |
mov.u32 %r3964, %r4217; | |
mov.u32 %r3966, %r4216; | |
mov.u32 %r3968, %r4215; | |
mov.u32 %r3970, %r4214; | |
mov.u32 %r3972, %r4213; | |
mov.u32 %r3974, %r4212; | |
mov.u32 %r4219, %r483; | |
mov.u32 %r4218, %r484; | |
mov.u32 %r4217, %r485; | |
mov.u32 %r4216, %r486; | |
mov.u32 %r4215, %r487; | |
mov.u32 %r4214, %r488; | |
mov.u32 %r4213, %r489; | |
mov.u32 %r4212, %r490; | |
mov.u32 %r4220, %r3974; | |
mov.u32 %r4221, %r3972; | |
mov.u32 %r4222, %r3970; | |
mov.u32 %r4223, %r3968; | |
mov.u32 %r4224, %r3966; | |
mov.u32 %r4225, %r3964; | |
mov.u32 %r4226, %r3962; | |
mov.u32 %r4227, %r3960; | |
BB0_156: | |
mov.u32 %r506, %r4212; | |
mul.lo.s64 %rd705, %rd32, 1792; | |
add.s64 %rd706, %rd3, %rd705; | |
bfe.u32 %r2114, %r419, 22, 6; | |
mul.wide.u32 %rd707, %r2114, 28; | |
add.s64 %rd708, %rd706, %rd707; | |
ld.global.u32 %r507, [%rd708+-4]; | |
and.b32 %r2115, %r507, 65535; | |
mul.wide.u32 %rd709, %r2115, 1792; | |
add.s64 %rd710, %rd136, %rd709; | |
bfe.u32 %r2116, %r507, 16, 6; | |
mul.wide.u32 %rd711, %r2116, 28; | |
add.s64 %rd712, %rd710, %rd711; | |
ld.global.u32 %r508, [%rd712+4]; | |
and.b32 %r2117, %r508, 65535; | |
mul.wide.u32 %rd713, %r2117, 1792; | |
add.s64 %rd714, %rd3, %rd713; | |
cvt.u64.u32 %rd40, %r2115; | |
cvt.u64.u32 %rd41, %r2117; | |
bfe.u32 %r2118, %r508, 16, 6; | |
mul.wide.u32 %rd715, %r2118, 28; | |
add.s64 %rd716, %rd714, %rd715; | |
ld.global.u32 %r509, [%rd716+-8]; | |
and.b32 %r2119, %r509, 65535; | |
cvt.u64.u32 %rd42, %r2119; | |
bfe.u32 %r2120, %r509, 16, 6; | |
mul.wide.u32 %rd717, %r2119, 1792; | |
add.s64 %rd718, %rd136, %rd717; | |
mul.wide.u32 %rd719, %r2120, 28; | |
add.s64 %rd720, %rd718, %rd719; | |
ld.global.u32 %r2121, [%rd720]; | |
and.b32 %r2122, %r2121, 65535; | |
bfe.u32 %r2123, %r2121, 16, 6; | |
mul.wide.u32 %rd721, %r2122, 1792; | |
add.s64 %rd722, %rd135, %rd721; | |
mul.wide.u32 %rd723, %r2123, 28; | |
add.s64 %rd724, %rd722, %rd723; | |
ld.global.u32 %r2124, [%rd724]; | |
and.b32 %r2125, %r2124, 65535; | |
shl.b32 %r2126, %r2125, 6; | |
bfe.u32 %r2127, %r2124, 16, 6; | |
or.b32 %r510, %r2126, %r2127; | |
st.local.u32 [%rd1+320], %r510; | |
bfe.u32 %r2128, %r2121, 22, 6; | |
mul.wide.u32 %rd725, %r2128, 28; | |
add.s64 %rd726, %rd722, %rd725; | |
ld.global.u32 %r2129, [%rd726]; | |
and.b32 %r2130, %r2129, 65535; | |
shl.b32 %r2131, %r2130, 6; | |
bfe.u32 %r2132, %r2129, 16, 6; | |
or.b32 %r4177, %r2131, %r2132; | |
st.local.u32 [%rd1+324], %r4177; | |
setp.le.u32 %p79, %r510, %r4177; | |
mov.u32 %r4176, %r510; | |
@%p79 bra BB0_158; | |
st.local.u32 [%rd1+320], %r4177; | |
st.local.u32 [%rd1+324], %r510; | |
mov.u32 %r4032, %r4177; | |
mov.u32 %r4177, %r510; | |
mov.u32 %r4176, %r4032; | |
BB0_158: | |
mov.u32 %r4172, %r4176; | |
mov.u32 %r4173, %r4177; | |
bfe.u32 %r2133, %r509, 22, 6; | |
mul.lo.s64 %rd727, %rd42, 1792; | |
add.s64 %rd728, %rd136, %rd727; | |
mul.wide.u32 %rd729, %r2133, 28; | |
add.s64 %rd730, %rd728, %rd729; | |
ld.global.u32 %r2134, [%rd730]; | |
and.b32 %r2135, %r2134, 65535; | |
bfe.u32 %r2136, %r2134, 16, 6; | |
mul.wide.u32 %rd731, %r2135, 1792; | |
add.s64 %rd732, %rd135, %rd731; | |
mul.wide.u32 %rd733, %r2136, 28; | |
add.s64 %rd734, %rd732, %rd733; | |
ld.global.u32 %r2137, [%rd734]; | |
and.b32 %r2138, %r2137, 65535; | |
shl.b32 %r2139, %r2138, 6; | |
bfe.u32 %r2140, %r2137, 16, 6; | |
or.b32 %r514, %r2139, %r2140; | |
st.local.u32 [%rd1+328], %r514; | |
bfe.u32 %r2141, %r2134, 22, 6; | |
mul.wide.u32 %rd735, %r2141, 28; | |
add.s64 %rd736, %rd732, %rd735; | |
ld.global.u32 %r2142, [%rd736]; | |
and.b32 %r2143, %r2142, 65535; | |
shl.b32 %r2144, %r2143, 6; | |
bfe.u32 %r2145, %r2142, 16, 6; | |
or.b32 %r4179, %r2144, %r2145; | |
st.local.u32 [%rd1+332], %r4179; | |
setp.le.u32 %p80, %r514, %r4179; | |
mov.u32 %r4178, %r514; | |
@%p80 bra BB0_160; | |
st.local.u32 [%rd1+328], %r4179; | |
st.local.u32 [%rd1+332], %r514; | |
mov.u32 %r4038, %r4179; | |
mov.u32 %r4179, %r514; | |
mov.u32 %r4178, %r4038; | |
BB0_160: | |
mov.u32 %r517, %r4178; | |
mov.u32 %r516, %r4179; | |
setp.le.u32 %p81, %r4172, %r517; | |
mov.u32 %r4174, %r517; | |
mov.u32 %r4175, %r516; | |
@%p81 bra BB0_162; | |
st.local.u32 [%rd1+320], %r517; | |
st.local.u32 [%rd1+328], %r4172; | |
st.local.u32 [%rd1+324], %r516; | |
st.local.u32 [%rd1+332], %r4173; | |
mov.u32 %r4035, %r4173; | |
mov.u32 %r4037, %r4172; | |
mov.u32 %r4173, %r516; | |
mov.u32 %r4172, %r517; | |
mov.u32 %r4174, %r4037; | |
mov.u32 %r4175, %r4035; | |
BB0_162: | |
mov.u32 %r4164, %r4172; | |
mov.u32 %r4165, %r4173; | |
mov.u32 %r4166, %r4174; | |
mov.u32 %r4167, %r4175; | |
mul.lo.s64 %rd737, %rd41, 1792; | |
add.s64 %rd738, %rd3, %rd737; | |
bfe.u32 %r2146, %r508, 22, 6; | |
mul.wide.u32 %rd739, %r2146, 28; | |
add.s64 %rd740, %rd738, %rd739; | |
ld.global.u32 %r522, [%rd740+-8]; | |
and.b32 %r2147, %r522, 65535; | |
cvt.u64.u32 %rd43, %r2147; | |
bfe.u32 %r2148, %r522, 16, 6; | |
mul.wide.u32 %rd741, %r2147, 1792; | |
add.s64 %rd742, %rd136, %rd741; | |
mul.wide.u32 %rd743, %r2148, 28; | |
add.s64 %rd744, %rd742, %rd743; | |
ld.global.u32 %r2149, [%rd744]; | |
and.b32 %r2150, %r2149, 65535; | |
bfe.u32 %r2151, %r2149, 16, 6; | |
mul.wide.u32 %rd745, %r2150, 1792; | |
add.s64 %rd746, %rd135, %rd745; | |
mul.wide.u32 %rd747, %r2151, 28; | |
add.s64 %rd748, %rd746, %rd747; | |
ld.global.u32 %r2152, [%rd748]; | |
and.b32 %r2153, %r2152, 65535; | |
shl.b32 %r2154, %r2153, 6; | |
bfe.u32 %r2155, %r2152, 16, 6; | |
or.b32 %r523, %r2154, %r2155; | |
st.local.u32 [%rd1+336], %r523; | |
bfe.u32 %r2156, %r2149, 22, 6; | |
mul.wide.u32 %rd749, %r2156, 28; | |
add.s64 %rd750, %rd746, %rd749; | |
ld.global.u32 %r2157, [%rd750]; | |
and.b32 %r2158, %r2157, 65535; | |
shl.b32 %r2159, %r2158, 6; | |
bfe.u32 %r2160, %r2157, 16, 6; | |
or.b32 %r4185, %r2159, %r2160; | |
st.local.u32 [%rd1+340], %r4185; | |
setp.le.u32 %p82, %r523, %r4185; | |
mov.u32 %r4184, %r523; | |
@%p82 bra BB0_164; | |
st.local.u32 [%rd1+336], %r4185; | |
st.local.u32 [%rd1+340], %r523; | |
mov.u32 %r4052, %r4185; | |
mov.u32 %r4185, %r523; | |
mov.u32 %r4184, %r4052; | |
BB0_164: | |
mov.u32 %r4180, %r4184; | |
mov.u32 %r4181, %r4185; | |
bfe.u32 %r2161, %r522, 22, 6; | |
mul.lo.s64 %rd751, %rd43, 1792; | |
add.s64 %rd752, %rd136, %rd751; | |
mul.wide.u32 %rd753, %r2161, 28; | |
add.s64 %rd754, %rd752, %rd753; | |
ld.global.u32 %r2162, [%rd754]; | |
and.b32 %r2163, %r2162, 65535; | |
bfe.u32 %r2164, %r2162, 16, 6; | |
mul.wide.u32 %rd755, %r2163, 1792; | |
add.s64 %rd756, %rd135, %rd755; | |
mul.wide.u32 %rd757, %r2164, 28; | |
add.s64 %rd758, %rd756, %rd757; | |
ld.global.u32 %r2165, [%rd758]; | |
and.b32 %r2166, %r2165, 65535; | |
shl.b32 %r2167, %r2166, 6; | |
bfe.u32 %r2168, %r2165, 16, 6; | |
or.b32 %r527, %r2167, %r2168; | |
st.local.u32 [%rd1+344], %r527; | |
bfe.u32 %r2169, %r2162, 22, 6; | |
mul.wide.u32 %rd759, %r2169, 28; | |
add.s64 %rd760, %rd756, %rd759; | |
ld.global.u32 %r2170, [%rd760]; | |
and.b32 %r2171, %r2170, 65535; | |
shl.b32 %r2172, %r2171, 6; | |
bfe.u32 %r2173, %r2170, 16, 6; | |
or.b32 %r4187, %r2172, %r2173; | |
st.local.u32 [%rd1+348], %r4187; | |
setp.le.u32 %p83, %r527, %r4187; | |
mov.u32 %r4186, %r527; | |
@%p83 bra BB0_166; | |
st.local.u32 [%rd1+344], %r4187; | |
st.local.u32 [%rd1+348], %r527; | |
mov.u32 %r4058, %r4187; | |
mov.u32 %r4187, %r527; | |
mov.u32 %r4186, %r4058; | |
BB0_166: | |
mov.u32 %r530, %r4186; | |
mov.u32 %r529, %r4187; | |
setp.le.u32 %p84, %r4180, %r530; | |
mov.u32 %r4182, %r530; | |
mov.u32 %r4183, %r529; | |
@%p84 bra BB0_168; | |
st.local.u32 [%rd1+336], %r530; | |
st.local.u32 [%rd1+344], %r4180; | |
st.local.u32 [%rd1+340], %r529; | |
st.local.u32 [%rd1+348], %r4181; | |
mov.u32 %r4055, %r4181; | |
mov.u32 %r4057, %r4180; | |
mov.u32 %r4181, %r529; | |
mov.u32 %r4180, %r530; | |
mov.u32 %r4182, %r4057; | |
mov.u32 %r4183, %r4055; | |
BB0_168: | |
mov.u32 %r534, %r4180; | |
mov.u32 %r533, %r4181; | |
mov.u32 %r532, %r4182; | |
mov.u32 %r531, %r4183; | |
setp.le.u32 %p85, %r4164, %r534; | |
mov.u32 %r4168, %r534; | |
mov.u32 %r4169, %r533; | |
mov.u32 %r4170, %r532; | |
mov.u32 %r4171, %r531; | |
@%p85 bra BB0_170; | |
st.local.u32 [%rd1+320], %r534; | |
st.local.u32 [%rd1+336], %r4164; | |
st.local.u32 [%rd1+324], %r533; | |
st.local.u32 [%rd1+340], %r4165; | |
st.local.u32 [%rd1+328], %r532; | |
st.local.u32 [%rd1+344], %r4166; | |
st.local.u32 [%rd1+332], %r531; | |
st.local.u32 [%rd1+348], %r4167; | |
mov.u32 %r4045, %r4167; | |
mov.u32 %r4047, %r4166; | |
mov.u32 %r4049, %r4165; | |
mov.u32 %r4051, %r4164; | |
mov.u32 %r4167, %r531; | |
mov.u32 %r4166, %r532; | |
mov.u32 %r4165, %r533; | |
mov.u32 %r4164, %r534; | |
mov.u32 %r4168, %r4051; | |
mov.u32 %r4169, %r4049; | |
mov.u32 %r4170, %r4047; | |
mov.u32 %r4171, %r4045; | |
BB0_170: | |
mov.u32 %r4148, %r4164; | |
mov.u32 %r4149, %r4165; | |
mov.u32 %r4150, %r4166; | |
mov.u32 %r4151, %r4167; | |
mov.u32 %r4152, %r4168; | |
mov.u32 %r4153, %r4169; | |
mov.u32 %r4154, %r4170; | |
mov.u32 %r4155, %r4171; | |
mul.lo.s64 %rd761, %rd40, 1792; | |
add.s64 %rd762, %rd136, %rd761; | |
bfe.u32 %r2174, %r507, 22, 6; | |
mul.wide.u32 %rd763, %r2174, 28; | |
add.s64 %rd764, %rd762, %rd763; | |
ld.global.u32 %r543, [%rd764+4]; | |
and.b32 %r2175, %r543, 65535; | |
mul.wide.u32 %rd765, %r2175, 1792; | |
add.s64 %rd766, %rd3, %rd765; | |
cvt.u64.u32 %rd44, %r2175; | |
bfe.u32 %r2176, %r543, 16, 6; | |
mul.wide.u32 %rd767, %r2176, 28; | |
add.s64 %rd768, %rd766, %rd767; | |
ld.global.u32 %r544, [%rd768+-8]; | |
and.b32 %r2177, %r544, 65535; | |
cvt.u64.u32 %rd45, %r2177; | |
bfe.u32 %r2178, %r544, 16, 6; | |
mul.wide.u32 %rd769, %r2177, 1792; | |
add.s64 %rd770, %rd136, %rd769; | |
mul.wide.u32 %rd771, %r2178, 28; | |
add.s64 %rd772, %rd770, %rd771; | |
ld.global.u32 %r2179, [%rd772]; | |
and.b32 %r2180, %r2179, 65535; | |
bfe.u32 %r2181, %r2179, 16, 6; | |
mul.wide.u32 %rd773, %r2180, 1792; | |
add.s64 %rd774, %rd135, %rd773; | |
mul.wide.u32 %rd775, %r2181, 28; | |
add.s64 %rd776, %rd774, %rd775; | |
ld.global.u32 %r2182, [%rd776]; | |
and.b32 %r2183, %r2182, 65535; | |
shl.b32 %r2184, %r2183, 6; | |
bfe.u32 %r2185, %r2182, 16, 6; | |
or.b32 %r545, %r2184, %r2185; | |
st.local.u32 [%rd1+352], %r545; | |
bfe.u32 %r2186, %r2179, 22, 6; | |
mul.wide.u32 %rd777, %r2186, 28; | |
add.s64 %rd778, %rd774, %rd777; | |
ld.global.u32 %r2187, [%rd778]; | |
and.b32 %r2188, %r2187, 65535; | |
shl.b32 %r2189, %r2188, 6; | |
bfe.u32 %r2190, %r2187, 16, 6; | |
or.b32 %r4201, %r2189, %r2190; | |
st.local.u32 [%rd1+356], %r4201; | |
setp.le.u32 %p86, %r545, %r4201; | |
mov.u32 %r4200, %r545; | |
@%p86 bra BB0_172; | |
st.local.u32 [%rd1+352], %r4201; | |
st.local.u32 [%rd1+356], %r545; | |
mov.u32 %r4088, %r4201; | |
mov.u32 %r4201, %r545; | |
mov.u32 %r4200, %r4088; | |
BB0_172: | |
mov.u32 %r4196, %r4200; | |
mov.u32 %r4197, %r4201; | |
bfe.u32 %r2191, %r544, 22, 6; | |
mul.lo.s64 %rd779, %rd45, 1792; | |
add.s64 %rd780, %rd136, %rd779; | |
mul.wide.u32 %rd781, %r2191, 28; | |
add.s64 %rd782, %rd780, %rd781; | |
ld.global.u32 %r2192, [%rd782]; | |
and.b32 %r2193, %r2192, 65535; | |
bfe.u32 %r2194, %r2192, 16, 6; | |
mul.wide.u32 %rd783, %r2193, 1792; | |
add.s64 %rd784, %rd135, %rd783; | |
mul.wide.u32 %rd785, %r2194, 28; | |
add.s64 %rd786, %rd784, %rd785; | |
ld.global.u32 %r2195, [%rd786]; | |
and.b32 %r2196, %r2195, 65535; | |
shl.b32 %r2197, %r2196, 6; | |
bfe.u32 %r2198, %r2195, 16, 6; | |
or.b32 %r549, %r2197, %r2198; | |
st.local.u32 [%rd1+360], %r549; | |
bfe.u32 %r2199, %r2192, 22, 6; | |
mul.wide.u32 %rd787, %r2199, 28; | |
add.s64 %rd788, %rd784, %rd787; | |
ld.global.u32 %r2200, [%rd788]; | |
and.b32 %r2201, %r2200, 65535; | |
shl.b32 %r2202, %r2201, 6; | |
bfe.u32 %r2203, %r2200, 16, 6; | |
or.b32 %r4203, %r2202, %r2203; | |
st.local.u32 [%rd1+364], %r4203; | |
setp.le.u32 %p87, %r549, %r4203; | |
mov.u32 %r4202, %r549; | |
@%p87 bra BB0_174; | |
st.local.u32 [%rd1+360], %r4203; | |
st.local.u32 [%rd1+364], %r549; | |
mov.u32 %r4094, %r4203; | |
mov.u32 %r4203, %r549; | |
mov.u32 %r4202, %r4094; | |
BB0_174: | |
mov.u32 %r552, %r4202; | |
mov.u32 %r551, %r4203; | |
setp.le.u32 %p88, %r4196, %r552; | |
mov.u32 %r4198, %r552; | |
mov.u32 %r4199, %r551; | |
@%p88 bra BB0_176; | |
st.local.u32 [%rd1+352], %r552; | |
st.local.u32 [%rd1+360], %r4196; | |
st.local.u32 [%rd1+356], %r551; | |
st.local.u32 [%rd1+364], %r4197; | |
mov.u32 %r4091, %r4197; | |
mov.u32 %r4093, %r4196; | |
mov.u32 %r4197, %r551; | |
mov.u32 %r4196, %r552; | |
mov.u32 %r4198, %r4093; | |
mov.u32 %r4199, %r4091; | |
BB0_176: | |
mov.u32 %r4188, %r4196; | |
mov.u32 %r4189, %r4197; | |
mov.u32 %r4190, %r4198; | |
mov.u32 %r4191, %r4199; | |
mul.lo.s64 %rd789, %rd44, 1792; | |
add.s64 %rd790, %rd3, %rd789; | |
bfe.u32 %r2204, %r543, 22, 6; | |
mul.wide.u32 %rd791, %r2204, 28; | |
add.s64 %rd792, %rd790, %rd791; | |
ld.global.u32 %r557, [%rd792+-8]; | |
and.b32 %r2205, %r557, 65535; | |
cvt.u64.u32 %rd46, %r2205; | |
bfe.u32 %r2206, %r557, 16, 6; | |
mul.wide.u32 %rd793, %r2205, 1792; | |
add.s64 %rd794, %rd136, %rd793; | |
mul.wide.u32 %rd795, %r2206, 28; | |
add.s64 %rd796, %rd794, %rd795; | |
ld.global.u32 %r2207, [%rd796]; | |
and.b32 %r2208, %r2207, 65535; | |
bfe.u32 %r2209, %r2207, 16, 6; | |
mul.wide.u32 %rd797, %r2208, 1792; | |
add.s64 %rd798, %rd135, %rd797; | |
mul.wide.u32 %rd799, %r2209, 28; | |
add.s64 %rd800, %rd798, %rd799; | |
ld.global.u32 %r2210, [%rd800]; | |
and.b32 %r2211, %r2210, 65535; | |
shl.b32 %r2212, %r2211, 6; | |
bfe.u32 %r2213, %r2210, 16, 6; | |
or.b32 %r558, %r2212, %r2213; | |
st.local.u32 [%rd1+368], %r558; | |
bfe.u32 %r2214, %r2207, 22, 6; | |
mul.wide.u32 %rd801, %r2214, 28; | |
add.s64 %rd802, %rd798, %rd801; | |
ld.global.u32 %r2215, [%rd802]; | |
and.b32 %r2216, %r2215, 65535; | |
shl.b32 %r2217, %r2216, 6; | |
bfe.u32 %r2218, %r2215, 16, 6; | |
or.b32 %r4209, %r2217, %r2218; | |
st.local.u32 [%rd1+372], %r4209; | |
setp.le.u32 %p89, %r558, %r4209; | |
mov.u32 %r4208, %r558; | |
@%p89 bra BB0_178; | |
st.local.u32 [%rd1+368], %r4209; | |
st.local.u32 [%rd1+372], %r558; | |
mov.u32 %r4108, %r4209; | |
mov.u32 %r4209, %r558; | |
mov.u32 %r4208, %r4108; | |
BB0_178: | |
mov.u32 %r4204, %r4208; | |
mov.u32 %r4205, %r4209; | |
bfe.u32 %r2219, %r557, 22, 6; | |
mul.lo.s64 %rd803, %rd46, 1792; | |
add.s64 %rd804, %rd136, %rd803; | |
mul.wide.u32 %rd805, %r2219, 28; | |
add.s64 %rd806, %rd804, %rd805; | |
ld.global.u32 %r2220, [%rd806]; | |
and.b32 %r2221, %r2220, 65535; | |
bfe.u32 %r2222, %r2220, 16, 6; | |
mul.wide.u32 %rd807, %r2221, 1792; | |
add.s64 %rd808, %rd135, %rd807; | |
mul.wide.u32 %rd809, %r2222, 28; | |
add.s64 %rd810, %rd808, %rd809; | |
ld.global.u32 %r2223, [%rd810]; | |
and.b32 %r2224, %r2223, 65535; | |
shl.b32 %r2225, %r2224, 6; | |
bfe.u32 %r2226, %r2223, 16, 6; | |
or.b32 %r562, %r2225, %r2226; | |
st.local.u32 [%rd1+376], %r562; | |
bfe.u32 %r2227, %r2220, 22, 6; | |
mul.wide.u32 %rd811, %r2227, 28; | |
add.s64 %rd812, %rd808, %rd811; | |
ld.global.u32 %r2228, [%rd812]; | |
and.b32 %r2229, %r2228, 65535; | |
shl.b32 %r2230, %r2229, 6; | |
bfe.u32 %r2231, %r2228, 16, 6; | |
or.b32 %r4211, %r2230, %r2231; | |
st.local.u32 [%rd1+380], %r4211; | |
setp.le.u32 %p90, %r562, %r4211; | |
mov.u32 %r4210, %r562; | |
@%p90 bra BB0_180; | |
st.local.u32 [%rd1+376], %r4211; | |
st.local.u32 [%rd1+380], %r562; | |
mov.u32 %r4114, %r4211; | |
mov.u32 %r4211, %r562; | |
mov.u32 %r4210, %r4114; | |
BB0_180: | |
mov.u32 %r565, %r4210; | |
mov.u32 %r564, %r4211; | |
setp.le.u32 %p91, %r4204, %r565; | |
mov.u32 %r4206, %r565; | |
mov.u32 %r4207, %r564; | |
@%p91 bra BB0_182; | |
st.local.u32 [%rd1+368], %r565; | |
st.local.u32 [%rd1+376], %r4204; | |
st.local.u32 [%rd1+372], %r564; | |
st.local.u32 [%rd1+380], %r4205; | |
mov.u32 %r4111, %r4205; | |
mov.u32 %r4113, %r4204; | |
mov.u32 %r4205, %r564; | |
mov.u32 %r4204, %r565; | |
mov.u32 %r4206, %r4113; | |
mov.u32 %r4207, %r4111; | |
BB0_182: | |
mov.u32 %r569, %r4204; | |
mov.u32 %r568, %r4205; | |
mov.u32 %r567, %r4206; | |
mov.u32 %r566, %r4207; | |
setp.le.u32 %p92, %r4188, %r569; | |
mov.u32 %r4192, %r569; | |
mov.u32 %r4193, %r568; | |
mov.u32 %r4194, %r567; | |
mov.u32 %r4195, %r566; | |
@%p92 bra BB0_184; | |
st.local.u32 [%rd1+352], %r569; | |
st.local.u32 [%rd1+368], %r4188; | |
st.local.u32 [%rd1+356], %r568; | |
st.local.u32 [%rd1+372], %r4189; | |
st.local.u32 [%rd1+360], %r567; | |
st.local.u32 [%rd1+376], %r4190; | |
st.local.u32 [%rd1+364], %r566; | |
st.local.u32 [%rd1+380], %r4191; | |
mov.u32 %r4101, %r4191; | |
mov.u32 %r4103, %r4190; | |
mov.u32 %r4105, %r4189; | |
mov.u32 %r4107, %r4188; | |
mov.u32 %r4191, %r566; | |
mov.u32 %r4190, %r567; | |
mov.u32 %r4189, %r568; | |
mov.u32 %r4188, %r569; | |
mov.u32 %r4192, %r4107; | |
mov.u32 %r4193, %r4105; | |
mov.u32 %r4194, %r4103; | |
mov.u32 %r4195, %r4101; | |
BB0_184: | |
mov.u32 %r577, %r4188; | |
mov.u32 %r576, %r4189; | |
mov.u32 %r575, %r4190; | |
mov.u32 %r574, %r4191; | |
mov.u32 %r573, %r4192; | |
mov.u32 %r572, %r4193; | |
mov.u32 %r571, %r4194; | |
mov.u32 %r570, %r4195; | |
setp.le.u32 %p93, %r4148, %r577; | |
mov.u32 %r4156, %r577; | |
mov.u32 %r4157, %r576; | |
mov.u32 %r4158, %r575; | |
mov.u32 %r4159, %r574; | |
mov.u32 %r4160, %r573; | |
mov.u32 %r4161, %r572; | |
mov.u32 %r4162, %r571; | |
mov.u32 %r4163, %r570; | |
@%p93 bra BB0_186; | |
st.local.u32 [%rd1+320], %r577; | |
st.local.u32 [%rd1+352], %r4148; | |
st.local.u32 [%rd1+324], %r576; | |
st.local.u32 [%rd1+356], %r4149; | |
st.local.u32 [%rd1+328], %r575; | |
st.local.u32 [%rd1+360], %r4150; | |
st.local.u32 [%rd1+332], %r574; | |
st.local.u32 [%rd1+364], %r4151; | |
st.local.u32 [%rd1+336], %r573; | |
st.local.u32 [%rd1+368], %r4152; | |
st.local.u32 [%rd1+340], %r572; | |
st.local.u32 [%rd1+372], %r4153; | |
st.local.u32 [%rd1+344], %r571; | |
st.local.u32 [%rd1+376], %r4154; | |
st.local.u32 [%rd1+348], %r570; | |
st.local.u32 [%rd1+380], %r4155; | |
mov.u32 %r4073, %r4155; | |
mov.u32 %r4075, %r4154; | |
mov.u32 %r4077, %r4153; | |
mov.u32 %r4079, %r4152; | |
mov.u32 %r4081, %r4151; | |
mov.u32 %r4083, %r4150; | |
mov.u32 %r4085, %r4149; | |
mov.u32 %r4087, %r4148; | |
mov.u32 %r4155, %r570; | |
mov.u32 %r4154, %r571; | |
mov.u32 %r4153, %r572; | |
mov.u32 %r4152, %r573; | |
mov.u32 %r4151, %r574; | |
mov.u32 %r4150, %r575; | |
mov.u32 %r4149, %r576; | |
mov.u32 %r4148, %r577; | |
mov.u32 %r4156, %r4087; | |
mov.u32 %r4157, %r4085; | |
mov.u32 %r4158, %r4083; | |
mov.u32 %r4159, %r4081; | |
mov.u32 %r4160, %r4079; | |
mov.u32 %r4161, %r4077; | |
mov.u32 %r4162, %r4075; | |
mov.u32 %r4163, %r4073; | |
BB0_186: | |
mov.u32 %r593, %r4148; | |
setp.le.u32 %p94, %r506, %r593; | |
mov.u32 %r4147, %r506; | |
@%p94 bra BB0_188; | |
st.local.u32 [%rd1+256], %r593; | |
st.local.u32 [%rd1+320], %r506; | |
st.local.u32 [%rd1+260], %r4149; | |
st.local.u32 [%rd1+324], %r4213; | |
st.local.u32 [%rd1+264], %r4150; | |
st.local.u32 [%rd1+328], %r4214; | |
st.local.u32 [%rd1+268], %r4151; | |
st.local.u32 [%rd1+332], %r4215; | |
st.local.u32 [%rd1+272], %r4152; | |
st.local.u32 [%rd1+336], %r4216; | |
st.local.u32 [%rd1+276], %r4153; | |
st.local.u32 [%rd1+340], %r4217; | |
st.local.u32 [%rd1+280], %r4154; | |
st.local.u32 [%rd1+344], %r4218; | |
st.local.u32 [%rd1+284], %r4155; | |
st.local.u32 [%rd1+348], %r4219; | |
st.local.u32 [%rd1+288], %r4156; | |
st.local.u32 [%rd1+352], %r4220; | |
st.local.u32 [%rd1+292], %r4157; | |
st.local.u32 [%rd1+356], %r4221; | |
st.local.u32 [%rd1+296], %r4158; | |
st.local.u32 [%rd1+360], %r4222; | |
st.local.u32 [%rd1+300], %r4159; | |
st.local.u32 [%rd1+364], %r4223; | |
st.local.u32 [%rd1+304], %r4160; | |
st.local.u32 [%rd1+368], %r4224; | |
st.local.u32 [%rd1+308], %r4161; | |
st.local.u32 [%rd1+372], %r4225; | |
st.local.u32 [%rd1+312], %r4162; | |
st.local.u32 [%rd1+376], %r4226; | |
st.local.u32 [%rd1+316], %r4163; | |
st.local.u32 [%rd1+380], %r4227; | |
mov.u32 %r4147, %r593; | |
BB0_188: | |
mov.u32 %r4146, %r4147; | |
mul.lo.s64 %rd814, %rd31, 1792; | |
add.s64 %rd815, %rd146, %rd814; | |
bfe.u32 %r2232, %r418, 22, 6; | |
mul.wide.u32 %rd816, %r2232, 28; | |
add.s64 %rd817, %rd815, %rd816; | |
ld.global.u32 %r595, [%rd817+4]; | |
and.b32 %r2233, %r595, 65535; | |
mul.wide.u32 %rd818, %r2233, 1792; | |
add.s64 %rd819, %rd3, %rd818; | |
bfe.u32 %r2234, %r595, 16, 6; | |
mul.wide.u32 %rd820, %r2234, 28; | |
add.s64 %rd821, %rd819, %rd820; | |
ld.global.u32 %r596, [%rd821+-4]; | |
and.b32 %r2235, %r596, 65535; | |
bfe.u32 %r2236, %r596, 16, 6; | |
mul.wide.u32 %rd822, %r2235, 1792; | |
add.s64 %rd823, %rd146, %rd822; | |
mul.wide.u32 %rd824, %r2236, 28; | |
add.s64 %rd825, %rd823, %rd824; | |
ld.global.u32 %r597, [%rd825]; | |
and.b32 %r2237, %r597, 65535; | |
mul.wide.u32 %rd826, %r2237, 1792; | |
add.s64 %rd827, %rd3, %rd826; | |
cvt.u64.u32 %rd47, %r2233; | |
cvt.u64.u32 %rd48, %r2235; | |
cvt.u64.u32 %rd49, %r2237; | |
bfe.u32 %r2238, %r597, 16, 6; | |
mul.wide.u32 %rd828, %r2238, 28; | |
add.s64 %rd829, %rd827, %rd828; | |
ld.global.u32 %r598, [%rd829+-8]; | |
and.b32 %r2239, %r598, 65535; | |
cvt.u64.u32 %rd50, %r2239; | |
bfe.u32 %r2240, %r598, 16, 6; | |
mul.wide.u32 %rd830, %r2239, 1792; | |
add.s64 %rd831, %rd136, %rd830; | |
mul.wide.u32 %rd832, %r2240, 28; | |
add.s64 %rd833, %rd831, %rd832; | |
ld.global.u32 %r2241, [%rd833]; | |
and.b32 %r2242, %r2241, 65535; | |
bfe.u32 %r2243, %r2241, 16, 6; | |
mul.wide.u32 %rd834, %r2242, 1792; | |
add.s64 %rd835, %rd135, %rd834; | |
mul.wide.u32 %rd836, %r2243, 28; | |
add.s64 %rd837, %rd835, %rd836; | |
ld.global.u32 %r2244, [%rd837]; | |
and.b32 %r2245, %r2244, 65535; | |
shl.b32 %r2246, %r2245, 6; | |
bfe.u32 %r2247, %r2244, 16, 6; | |
or.b32 %r599, %r2246, %r2247; | |
st.local.u32 [%rd1+384], %r599; | |
bfe.u32 %r2248, %r2241, 22, 6; | |
mul.wide.u32 %rd838, %r2248, 28; | |
add.s64 %rd839, %rd835, %rd838; | |
ld.global.u32 %r2249, [%rd839]; | |
and.b32 %r2250, %r2249, 65535; | |
shl.b32 %r2251, %r2250, 6; | |
bfe.u32 %r2252, %r2249, 16, 6; | |
or.b32 %r3883, %r2251, %r2252; | |
st.local.u32 [%rd1+388], %r3883; | |
setp.le.u32 %p95, %r599, %r3883; | |
mov.u32 %r3882, %r599; | |
@%p95 bra BB0_190; | |
st.local.u32 [%rd1+384], %r3883; | |
st.local.u32 [%rd1+388], %r599; | |
mov.u32 %r3563, %r3883; | |
mov.u32 %r3883, %r599; | |
mov.u32 %r3882, %r3563; | |
BB0_190: | |
mov.u32 %r3878, %r3882; | |
mov.u32 %r3879, %r3883; | |
bfe.u32 %r2253, %r598, 22, 6; | |
mul.lo.s64 %rd840, %rd50, 1792; | |
add.s64 %rd841, %rd136, %rd840; | |
mul.wide.u32 %rd842, %r2253, 28; | |
add.s64 %rd843, %rd841, %rd842; | |
ld.global.u32 %r2254, [%rd843]; | |
and.b32 %r2255, %r2254, 65535; | |
bfe.u32 %r2256, %r2254, 16, 6; | |
mul.wide.u32 %rd844, %r2255, 1792; | |
add.s64 %rd845, %rd135, %rd844; | |
mul.wide.u32 %rd846, %r2256, 28; | |
add.s64 %rd847, %rd845, %rd846; | |
ld.global.u32 %r2257, [%rd847]; | |
and.b32 %r2258, %r2257, 65535; | |
shl.b32 %r2259, %r2258, 6; | |
bfe.u32 %r2260, %r2257, 16, 6; | |
or.b32 %r603, %r2259, %r2260; | |
st.local.u32 [%rd1+392], %r603; | |
bfe.u32 %r2261, %r2254, 22, 6; | |
mul.wide.u32 %rd848, %r2261, 28; | |
add.s64 %rd849, %rd845, %rd848; | |
ld.global.u32 %r2262, [%rd849]; | |
and.b32 %r2263, %r2262, 65535; | |
shl.b32 %r2264, %r2263, 6; | |
bfe.u32 %r2265, %r2262, 16, 6; | |
or.b32 %r3885, %r2264, %r2265; | |
st.local.u32 [%rd1+396], %r3885; | |
setp.le.u32 %p96, %r603, %r3885; | |
mov.u32 %r3884, %r603; | |
@%p96 bra BB0_192; | |
st.local.u32 [%rd1+392], %r3885; | |
st.local.u32 [%rd1+396], %r603; | |
mov.u32 %r3569, %r3885; | |
mov.u32 %r3885, %r603; | |
mov.u32 %r3884, %r3569; | |
BB0_192: | |
mov.u32 %r606, %r3884; | |
mov.u32 %r605, %r3885; | |
setp.le.u32 %p97, %r3878, %r606; | |
mov.u32 %r3880, %r606; | |
mov.u32 %r3881, %r605; | |
@%p97 bra BB0_194; | |
st.local.u32 [%rd1+384], %r606; | |
st.local.u32 [%rd1+392], %r3878; | |
st.local.u32 [%rd1+388], %r605; | |
st.local.u32 [%rd1+396], %r3879; | |
mov.u32 %r3566, %r3879; | |
mov.u32 %r3568, %r3878; | |
mov.u32 %r3879, %r605; | |
mov.u32 %r3878, %r606; | |
mov.u32 %r3880, %r3568; | |
mov.u32 %r3881, %r3566; | |
BB0_194: | |
mov.u32 %r3870, %r3878; | |
mov.u32 %r3871, %r3879; | |
mov.u32 %r3872, %r3880; | |
mov.u32 %r3873, %r3881; | |
mul.lo.s64 %rd850, %rd49, 1792; | |
add.s64 %rd851, %rd3, %rd850; | |
bfe.u32 %r2266, %r597, 22, 6; | |
mul.wide.u32 %rd852, %r2266, 28; | |
add.s64 %rd853, %rd851, %rd852; | |
ld.global.u32 %r611, [%rd853+-8]; | |
and.b32 %r2267, %r611, 65535; | |
cvt.u64.u32 %rd51, %r2267; | |
bfe.u32 %r2268, %r611, 16, 6; | |
mul.wide.u32 %rd854, %r2267, 1792; | |
add.s64 %rd855, %rd136, %rd854; | |
mul.wide.u32 %rd856, %r2268, 28; | |
add.s64 %rd857, %rd855, %rd856; | |
ld.global.u32 %r2269, [%rd857]; | |
and.b32 %r2270, %r2269, 65535; | |
bfe.u32 %r2271, %r2269, 16, 6; | |
mul.wide.u32 %rd858, %r2270, 1792; | |
add.s64 %rd859, %rd135, %rd858; | |
mul.wide.u32 %rd860, %r2271, 28; | |
add.s64 %rd861, %rd859, %rd860; | |
ld.global.u32 %r2272, [%rd861]; | |
and.b32 %r2273, %r2272, 65535; | |
shl.b32 %r2274, %r2273, 6; | |
bfe.u32 %r2275, %r2272, 16, 6; | |
or.b32 %r612, %r2274, %r2275; | |
st.local.u32 [%rd1+400], %r612; | |
bfe.u32 %r2276, %r2269, 22, 6; | |
mul.wide.u32 %rd862, %r2276, 28; | |
add.s64 %rd863, %rd859, %rd862; | |
ld.global.u32 %r2277, [%rd863]; | |
and.b32 %r2278, %r2277, 65535; | |
shl.b32 %r2279, %r2278, 6; | |
bfe.u32 %r2280, %r2277, 16, 6; | |
or.b32 %r3891, %r2279, %r2280; | |
st.local.u32 [%rd1+404], %r3891; | |
setp.le.u32 %p98, %r612, %r3891; | |
mov.u32 %r3890, %r612; | |
@%p98 bra BB0_196; | |
st.local.u32 [%rd1+400], %r3891; | |
st.local.u32 [%rd1+404], %r612; | |
mov.u32 %r3583, %r3891; | |
mov.u32 %r3891, %r612; | |
mov.u32 %r3890, %r3583; | |
BB0_196: | |
mov.u32 %r3886, %r3890; | |
mov.u32 %r3887, %r3891; | |
bfe.u32 %r2281, %r611, 22, 6; | |
mul.lo.s64 %rd864, %rd51, 1792; | |
add.s64 %rd865, %rd136, %rd864; | |
mul.wide.u32 %rd866, %r2281, 28; | |
add.s64 %rd867, %rd865, %rd866; | |
ld.global.u32 %r2282, [%rd867]; | |
and.b32 %r2283, %r2282, 65535; | |
bfe.u32 %r2284, %r2282, 16, 6; | |
mul.wide.u32 %rd868, %r2283, 1792; | |
add.s64 %rd869, %rd135, %rd868; | |
mul.wide.u32 %rd870, %r2284, 28; | |
add.s64 %rd871, %rd869, %rd870; | |
ld.global.u32 %r2285, [%rd871]; | |
and.b32 %r2286, %r2285, 65535; | |
shl.b32 %r2287, %r2286, 6; | |
bfe.u32 %r2288, %r2285, 16, 6; | |
or.b32 %r616, %r2287, %r2288; | |
st.local.u32 [%rd1+408], %r616; | |
bfe.u32 %r2289, %r2282, 22, 6; | |
mul.wide.u32 %rd872, %r2289, 28; | |
add.s64 %rd873, %rd869, %rd872; | |
ld.global.u32 %r2290, [%rd873]; | |
and.b32 %r2291, %r2290, 65535; | |
shl.b32 %r2292, %r2291, 6; | |
bfe.u32 %r2293, %r2290, 16, 6; | |
or.b32 %r3893, %r2292, %r2293; | |
st.local.u32 [%rd1+412], %r3893; | |
setp.le.u32 %p99, %r616, %r3893; | |
mov.u32 %r3892, %r616; | |
@%p99 bra BB0_198; | |
st.local.u32 [%rd1+408], %r3893; | |
st.local.u32 [%rd1+412], %r616; | |
mov.u32 %r3589, %r3893; | |
mov.u32 %r3893, %r616; | |
mov.u32 %r3892, %r3589; | |
BB0_198: | |
mov.u32 %r619, %r3892; | |
mov.u32 %r618, %r3893; | |
setp.le.u32 %p100, %r3886, %r619; | |
mov.u32 %r3888, %r619; | |
mov.u32 %r3889, %r618; | |
@%p100 bra BB0_200; | |
st.local.u32 [%rd1+400], %r619; | |
st.local.u32 [%rd1+408], %r3886; | |
st.local.u32 [%rd1+404], %r618; | |
st.local.u32 [%rd1+412], %r3887; | |
mov.u32 %r3586, %r3887; | |
mov.u32 %r3588, %r3886; | |
mov.u32 %r3887, %r618; | |
mov.u32 %r3886, %r619; | |
mov.u32 %r3888, %r3588; | |
mov.u32 %r3889, %r3586; | |
BB0_200: | |
mov.u32 %r623, %r3886; | |
mov.u32 %r622, %r3887; | |
mov.u32 %r621, %r3888; | |
mov.u32 %r620, %r3889; | |
setp.le.u32 %p101, %r3870, %r623; | |
mov.u32 %r3874, %r623; | |
mov.u32 %r3875, %r622; | |
mov.u32 %r3876, %r621; | |
mov.u32 %r3877, %r620; | |
@%p101 bra BB0_202; | |
st.local.u32 [%rd1+384], %r623; | |
st.local.u32 [%rd1+400], %r3870; | |
st.local.u32 [%rd1+388], %r622; | |
st.local.u32 [%rd1+404], %r3871; | |
st.local.u32 [%rd1+392], %r621; | |
st.local.u32 [%rd1+408], %r3872; | |
st.local.u32 [%rd1+396], %r620; | |
st.local.u32 [%rd1+412], %r3873; | |
mov.u32 %r3576, %r3873; | |
mov.u32 %r3578, %r3872; | |
mov.u32 %r3580, %r3871; | |
mov.u32 %r3582, %r3870; | |
mov.u32 %r3873, %r620; | |
mov.u32 %r3872, %r621; | |
mov.u32 %r3871, %r622; | |
mov.u32 %r3870, %r623; | |
mov.u32 %r3874, %r3582; | |
mov.u32 %r3875, %r3580; | |
mov.u32 %r3876, %r3578; | |
mov.u32 %r3877, %r3576; | |
BB0_202: | |
mov.u32 %r3854, %r3870; | |
mov.u32 %r3855, %r3871; | |
mov.u32 %r3856, %r3872; | |
mov.u32 %r3857, %r3873; | |
mov.u32 %r3858, %r3874; | |
mov.u32 %r3859, %r3875; | |
mov.u32 %r3860, %r3876; | |
mov.u32 %r3861, %r3877; | |
mul.lo.s64 %rd874, %rd48, 1792; | |
add.s64 %rd875, %rd136, %rd874; | |
bfe.u32 %r2294, %r596, 22, 6; | |
mul.wide.u32 %rd876, %r2294, 28; | |
add.s64 %rd877, %rd875, %rd876; | |
ld.global.u32 %r632, [%rd877+4]; | |
and.b32 %r2295, %r632, 65535; | |
mul.wide.u32 %rd878, %r2295, 1792; | |
add.s64 %rd879, %rd3, %rd878; | |
cvt.u64.u32 %rd52, %r2295; | |
bfe.u32 %r2296, %r632, 16, 6; | |
mul.wide.u32 %rd880, %r2296, 28; | |
add.s64 %rd881, %rd879, %rd880; | |
ld.global.u32 %r633, [%rd881+-8]; | |
and.b32 %r2297, %r633, 65535; | |
cvt.u64.u32 %rd53, %r2297; | |
bfe.u32 %r2298, %r633, 16, 6; | |
mul.wide.u32 %rd882, %r2297, 1792; | |
add.s64 %rd883, %rd136, %rd882; | |
mul.wide.u32 %rd884, %r2298, 28; | |
add.s64 %rd885, %rd883, %rd884; | |
ld.global.u32 %r2299, [%rd885]; | |
and.b32 %r2300, %r2299, 65535; | |
bfe.u32 %r2301, %r2299, 16, 6; | |
mul.wide.u32 %rd886, %r2300, 1792; | |
add.s64 %rd887, %rd135, %rd886; | |
mul.wide.u32 %rd888, %r2301, 28; | |
add.s64 %rd889, %rd887, %rd888; | |
ld.global.u32 %r2302, [%rd889]; | |
and.b32 %r2303, %r2302, 65535; | |
shl.b32 %r2304, %r2303, 6; | |
bfe.u32 %r2305, %r2302, 16, 6; | |
or.b32 %r634, %r2304, %r2305; | |
st.local.u32 [%rd1+416], %r634; | |
bfe.u32 %r2306, %r2299, 22, 6; | |
mul.wide.u32 %rd890, %r2306, 28; | |
add.s64 %rd891, %rd887, %rd890; | |
ld.global.u32 %r2307, [%rd891]; | |
and.b32 %r2308, %r2307, 65535; | |
shl.b32 %r2309, %r2308, 6; | |
bfe.u32 %r2310, %r2307, 16, 6; | |
or.b32 %r3907, %r2309, %r2310; | |
st.local.u32 [%rd1+420], %r3907; | |
setp.le.u32 %p102, %r634, %r3907; | |
mov.u32 %r3906, %r634; | |
@%p102 bra BB0_204; | |
st.local.u32 [%rd1+416], %r3907; | |
st.local.u32 [%rd1+420], %r634; | |
mov.u32 %r3619, %r3907; | |
mov.u32 %r3907, %r634; | |
mov.u32 %r3906, %r3619; | |
BB0_204: | |
mov.u32 %r3902, %r3906; | |
mov.u32 %r3903, %r3907; | |
bfe.u32 %r2311, %r633, 22, 6; | |
mul.lo.s64 %rd892, %rd53, 1792; | |
add.s64 %rd893, %rd136, %rd892; | |
mul.wide.u32 %rd894, %r2311, 28; | |
add.s64 %rd895, %rd893, %rd894; | |
ld.global.u32 %r2312, [%rd895]; | |
and.b32 %r2313, %r2312, 65535; | |
bfe.u32 %r2314, %r2312, 16, 6; | |
mul.wide.u32 %rd896, %r2313, 1792; | |
add.s64 %rd897, %rd135, %rd896; | |
mul.wide.u32 %rd898, %r2314, 28; | |
add.s64 %rd899, %rd897, %rd898; | |
ld.global.u32 %r2315, [%rd899]; | |
and.b32 %r2316, %r2315, 65535; | |
shl.b32 %r2317, %r2316, 6; | |
bfe.u32 %r2318, %r2315, 16, 6; | |
or.b32 %r638, %r2317, %r2318; | |
st.local.u32 [%rd1+424], %r638; | |
bfe.u32 %r2319, %r2312, 22, 6; | |
mul.wide.u32 %rd900, %r2319, 28; | |
add.s64 %rd901, %rd897, %rd900; | |
ld.global.u32 %r2320, [%rd901]; | |
and.b32 %r2321, %r2320, 65535; | |
shl.b32 %r2322, %r2321, 6; | |
bfe.u32 %r2323, %r2320, 16, 6; | |
or.b32 %r3909, %r2322, %r2323; | |
st.local.u32 [%rd1+428], %r3909; | |
setp.le.u32 %p103, %r638, %r3909; | |
mov.u32 %r3908, %r638; | |
@%p103 bra BB0_206; | |
st.local.u32 [%rd1+424], %r3909; | |
st.local.u32 [%rd1+428], %r638; | |
mov.u32 %r3625, %r3909; | |
mov.u32 %r3909, %r638; | |
mov.u32 %r3908, %r3625; | |
BB0_206: | |
mov.u32 %r641, %r3908; | |
mov.u32 %r640, %r3909; | |
setp.le.u32 %p104, %r3902, %r641; | |
mov.u32 %r3904, %r641; | |
mov.u32 %r3905, %r640; | |
@%p104 bra BB0_208; | |
st.local.u32 [%rd1+416], %r641; | |
st.local.u32 [%rd1+424], %r3902; | |
st.local.u32 [%rd1+420], %r640; | |
st.local.u32 [%rd1+428], %r3903; | |
mov.u32 %r3622, %r3903; | |
mov.u32 %r3624, %r3902; | |
mov.u32 %r3903, %r640; | |
mov.u32 %r3902, %r641; | |
mov.u32 %r3904, %r3624; | |
mov.u32 %r3905, %r3622; | |
BB0_208: | |
mov.u32 %r3894, %r3902; | |
mov.u32 %r3895, %r3903; | |
mov.u32 %r3896, %r3904; | |
mov.u32 %r3897, %r3905; | |
mul.lo.s64 %rd902, %rd52, 1792; | |
add.s64 %rd903, %rd3, %rd902; | |
bfe.u32 %r2324, %r632, 22, 6; | |
mul.wide.u32 %rd904, %r2324, 28; | |
add.s64 %rd905, %rd903, %rd904; | |
ld.global.u32 %r646, [%rd905+-8]; | |
and.b32 %r2325, %r646, 65535; | |
cvt.u64.u32 %rd54, %r2325; | |
bfe.u32 %r2326, %r646, 16, 6; | |
mul.wide.u32 %rd906, %r2325, 1792; | |
add.s64 %rd907, %rd136, %rd906; | |
mul.wide.u32 %rd908, %r2326, 28; | |
add.s64 %rd909, %rd907, %rd908; | |
ld.global.u32 %r2327, [%rd909]; | |
and.b32 %r2328, %r2327, 65535; | |
bfe.u32 %r2329, %r2327, 16, 6; | |
mul.wide.u32 %rd910, %r2328, 1792; | |
add.s64 %rd911, %rd135, %rd910; | |
mul.wide.u32 %rd912, %r2329, 28; | |
add.s64 %rd913, %rd911, %rd912; | |
ld.global.u32 %r2330, [%rd913]; | |
and.b32 %r2331, %r2330, 65535; | |
shl.b32 %r2332, %r2331, 6; | |
bfe.u32 %r2333, %r2330, 16, 6; | |
or.b32 %r647, %r2332, %r2333; | |
st.local.u32 [%rd1+432], %r647; | |
bfe.u32 %r2334, %r2327, 22, 6; | |
mul.wide.u32 %rd914, %r2334, 28; | |
add.s64 %rd915, %rd911, %rd914; | |
ld.global.u32 %r2335, [%rd915]; | |
and.b32 %r2336, %r2335, 65535; | |
shl.b32 %r2337, %r2336, 6; | |
bfe.u32 %r2338, %r2335, 16, 6; | |
or.b32 %r3915, %r2337, %r2338; | |
st.local.u32 [%rd1+436], %r3915; | |
setp.le.u32 %p105, %r647, %r3915; | |
mov.u32 %r3914, %r647; | |
@%p105 bra BB0_210; | |
st.local.u32 [%rd1+432], %r3915; | |
st.local.u32 [%rd1+436], %r647; | |
mov.u32 %r3639, %r3915; | |
mov.u32 %r3915, %r647; | |
mov.u32 %r3914, %r3639; | |
BB0_210: | |
mov.u32 %r3910, %r3914; | |
mov.u32 %r3911, %r3915; | |
bfe.u32 %r2339, %r646, 22, 6; | |
mul.lo.s64 %rd916, %rd54, 1792; | |
add.s64 %rd917, %rd136, %rd916; | |
mul.wide.u32 %rd918, %r2339, 28; | |
add.s64 %rd919, %rd917, %rd918; | |
ld.global.u32 %r2340, [%rd919]; | |
and.b32 %r2341, %r2340, 65535; | |
bfe.u32 %r2342, %r2340, 16, 6; | |
mul.wide.u32 %rd920, %r2341, 1792; | |
add.s64 %rd921, %rd135, %rd920; | |
mul.wide.u32 %rd922, %r2342, 28; | |
add.s64 %rd923, %rd921, %rd922; | |
ld.global.u32 %r2343, [%rd923]; | |
and.b32 %r2344, %r2343, 65535; | |
shl.b32 %r2345, %r2344, 6; | |
bfe.u32 %r2346, %r2343, 16, 6; | |
or.b32 %r651, %r2345, %r2346; | |
st.local.u32 [%rd1+440], %r651; | |
bfe.u32 %r2347, %r2340, 22, 6; | |
mul.wide.u32 %rd924, %r2347, 28; | |
add.s64 %rd925, %rd921, %rd924; | |
ld.global.u32 %r2348, [%rd925]; | |
and.b32 %r2349, %r2348, 65535; | |
shl.b32 %r2350, %r2349, 6; | |
bfe.u32 %r2351, %r2348, 16, 6; | |
or.b32 %r3917, %r2350, %r2351; | |
st.local.u32 [%rd1+444], %r3917; | |
setp.le.u32 %p106, %r651, %r3917; | |
mov.u32 %r3916, %r651; | |
@%p106 bra BB0_212; | |
st.local.u32 [%rd1+440], %r3917; | |
st.local.u32 [%rd1+444], %r651; | |
mov.u32 %r3645, %r3917; | |
mov.u32 %r3917, %r651; | |
mov.u32 %r3916, %r3645; | |
BB0_212: | |
mov.u32 %r654, %r3916; | |
mov.u32 %r653, %r3917; | |
setp.le.u32 %p107, %r3910, %r654; | |
mov.u32 %r3912, %r654; | |
mov.u32 %r3913, %r653; | |
@%p107 bra BB0_214; | |
st.local.u32 [%rd1+432], %r654; | |
st.local.u32 [%rd1+440], %r3910; | |
st.local.u32 [%rd1+436], %r653; | |
st.local.u32 [%rd1+444], %r3911; | |
mov.u32 %r3642, %r3911; | |
mov.u32 %r3644, %r3910; | |
mov.u32 %r3911, %r653; | |
mov.u32 %r3910, %r654; | |
mov.u32 %r3912, %r3644; | |
mov.u32 %r3913, %r3642; | |
BB0_214: | |
mov.u32 %r658, %r3910; | |
mov.u32 %r657, %r3911; | |
mov.u32 %r656, %r3912; | |
mov.u32 %r655, %r3913; | |
setp.le.u32 %p108, %r3894, %r658; | |
mov.u32 %r3898, %r658; | |
mov.u32 %r3899, %r657; | |
mov.u32 %r3900, %r656; | |
mov.u32 %r3901, %r655; | |
@%p108 bra BB0_216; | |
st.local.u32 [%rd1+416], %r658; | |
st.local.u32 [%rd1+432], %r3894; | |
st.local.u32 [%rd1+420], %r657; | |
st.local.u32 [%rd1+436], %r3895; | |
st.local.u32 [%rd1+424], %r656; | |
st.local.u32 [%rd1+440], %r3896; | |
st.local.u32 [%rd1+428], %r655; | |
st.local.u32 [%rd1+444], %r3897; | |
mov.u32 %r3632, %r3897; | |
mov.u32 %r3634, %r3896; | |
mov.u32 %r3636, %r3895; | |
mov.u32 %r3638, %r3894; | |
mov.u32 %r3897, %r655; | |
mov.u32 %r3896, %r656; | |
mov.u32 %r3895, %r657; | |
mov.u32 %r3894, %r658; | |
mov.u32 %r3898, %r3638; | |
mov.u32 %r3899, %r3636; | |
mov.u32 %r3900, %r3634; | |
mov.u32 %r3901, %r3632; | |
BB0_216: | |
mov.u32 %r666, %r3894; | |
mov.u32 %r665, %r3895; | |
mov.u32 %r664, %r3896; | |
mov.u32 %r663, %r3897; | |
mov.u32 %r662, %r3898; | |
mov.u32 %r661, %r3899; | |
mov.u32 %r660, %r3900; | |
mov.u32 %r659, %r3901; | |
setp.le.u32 %p109, %r3854, %r666; | |
mov.u32 %r3862, %r666; | |
mov.u32 %r3863, %r665; | |
mov.u32 %r3864, %r664; | |
mov.u32 %r3865, %r663; | |
mov.u32 %r3866, %r662; | |
mov.u32 %r3867, %r661; | |
mov.u32 %r3868, %r660; | |
mov.u32 %r3869, %r659; | |
@%p109 bra BB0_218; | |
st.local.u32 [%rd1+384], %r666; | |
st.local.u32 [%rd1+416], %r3854; | |
st.local.u32 [%rd1+388], %r665; | |
st.local.u32 [%rd1+420], %r3855; | |
st.local.u32 [%rd1+392], %r664; | |
st.local.u32 [%rd1+424], %r3856; | |
st.local.u32 [%rd1+396], %r663; | |
st.local.u32 [%rd1+428], %r3857; | |
st.local.u32 [%rd1+400], %r662; | |
st.local.u32 [%rd1+432], %r3858; | |
st.local.u32 [%rd1+404], %r661; | |
st.local.u32 [%rd1+436], %r3859; | |
st.local.u32 [%rd1+408], %r660; | |
st.local.u32 [%rd1+440], %r3860; | |
st.local.u32 [%rd1+412], %r659; | |
st.local.u32 [%rd1+444], %r3861; | |
mov.u32 %r3604, %r3861; | |
mov.u32 %r3606, %r3860; | |
mov.u32 %r3608, %r3859; | |
mov.u32 %r3610, %r3858; | |
mov.u32 %r3612, %r3857; | |
mov.u32 %r3614, %r3856; | |
mov.u32 %r3616, %r3855; | |
mov.u32 %r3618, %r3854; | |
mov.u32 %r3861, %r659; | |
mov.u32 %r3860, %r660; | |
mov.u32 %r3859, %r661; | |
mov.u32 %r3858, %r662; | |
mov.u32 %r3857, %r663; | |
mov.u32 %r3856, %r664; | |
mov.u32 %r3855, %r665; | |
mov.u32 %r3854, %r666; | |
mov.u32 %r3862, %r3618; | |
mov.u32 %r3863, %r3616; | |
mov.u32 %r3864, %r3614; | |
mov.u32 %r3865, %r3612; | |
mov.u32 %r3866, %r3610; | |
mov.u32 %r3867, %r3608; | |
mov.u32 %r3868, %r3606; | |
mov.u32 %r3869, %r3604; | |
BB0_218: | |
mov.u32 %r682, %r3854; | |
mul.lo.s64 %rd926, %rd47, 1792; | |
add.s64 %rd927, %rd3, %rd926; | |
bfe.u32 %r2352, %r595, 22, 6; | |
mul.wide.u32 %rd928, %r2352, 28; | |
add.s64 %rd929, %rd927, %rd928; | |
ld.global.u32 %r683, [%rd929+-4]; | |
and.b32 %r2353, %r683, 65535; | |
mul.wide.u32 %rd930, %r2353, 1792; | |
add.s64 %rd931, %rd136, %rd930; | |
bfe.u32 %r2354, %r683, 16, 6; | |
mul.wide.u32 %rd932, %r2354, 28; | |
add.s64 %rd933, %rd931, %rd932; | |
ld.global.u32 %r684, [%rd933+4]; | |
and.b32 %r2355, %r684, 65535; | |
mul.wide.u32 %rd934, %r2355, 1792; | |
add.s64 %rd935, %rd3, %rd934; | |
cvt.u64.u32 %rd55, %r2353; | |
cvt.u64.u32 %rd56, %r2355; | |
bfe.u32 %r2356, %r684, 16, 6; | |
mul.wide.u32 %rd936, %r2356, 28; | |
add.s64 %rd937, %rd935, %rd936; | |
ld.global.u32 %r685, [%rd937+-8]; | |
and.b32 %r2357, %r685, 65535; | |
cvt.u64.u32 %rd57, %r2357; | |
bfe.u32 %r2358, %r685, 16, 6; | |
mul.wide.u32 %rd938, %r2357, 1792; | |
add.s64 %rd939, %rd136, %rd938; | |
mul.wide.u32 %rd940, %r2358, 28; | |
add.s64 %rd941, %rd939, %rd940; | |
ld.global.u32 %r2359, [%rd941]; | |
and.b32 %r2360, %r2359, 65535; | |
bfe.u32 %r2361, %r2359, 16, 6; | |
mul.wide.u32 %rd942, %r2360, 1792; | |
add.s64 %rd943, %rd135, %rd942; | |
mul.wide.u32 %rd944, %r2361, 28; | |
add.s64 %rd945, %rd943, %rd944; | |
ld.global.u32 %r2362, [%rd945]; | |
and.b32 %r2363, %r2362, 65535; | |
shl.b32 %r2364, %r2363, 6; | |
bfe.u32 %r2365, %r2362, 16, 6; | |
or.b32 %r686, %r2364, %r2365; | |
st.local.u32 [%rd1+448], %r686; | |
bfe.u32 %r2366, %r2359, 22, 6; | |
mul.wide.u32 %rd946, %r2366, 28; | |
add.s64 %rd947, %rd943, %rd946; | |
ld.global.u32 %r2367, [%rd947]; | |
and.b32 %r2368, %r2367, 65535; | |
shl.b32 %r2369, %r2368, 6; | |
bfe.u32 %r2370, %r2367, 16, 6; | |
or.b32 %r3819, %r2369, %r2370; | |
st.local.u32 [%rd1+452], %r3819; | |
setp.le.u32 %p110, %r686, %r3819; | |
mov.u32 %r3818, %r686; | |
@%p110 bra BB0_220; | |
st.local.u32 [%rd1+448], %r3819; | |
st.local.u32 [%rd1+452], %r686; | |
mov.u32 %r3676, %r3819; | |
mov.u32 %r3819, %r686; | |
mov.u32 %r3818, %r3676; | |
BB0_220: | |
mov.u32 %r3814, %r3818; | |
mov.u32 %r3815, %r3819; | |
bfe.u32 %r2371, %r685, 22, 6; | |
mul.lo.s64 %rd948, %rd57, 1792; | |
add.s64 %rd949, %rd136, %rd948; | |
mul.wide.u32 %rd950, %r2371, 28; | |
add.s64 %rd951, %rd949, %rd950; | |
ld.global.u32 %r2372, [%rd951]; | |
and.b32 %r2373, %r2372, 65535; | |
bfe.u32 %r2374, %r2372, 16, 6; | |
mul.wide.u32 %rd952, %r2373, 1792; | |
add.s64 %rd953, %rd135, %rd952; | |
mul.wide.u32 %rd954, %r2374, 28; | |
add.s64 %rd955, %rd953, %rd954; | |
ld.global.u32 %r2375, [%rd955]; | |
and.b32 %r2376, %r2375, 65535; | |
shl.b32 %r2377, %r2376, 6; | |
bfe.u32 %r2378, %r2375, 16, 6; | |
or.b32 %r690, %r2377, %r2378; | |
st.local.u32 [%rd1+456], %r690; | |
bfe.u32 %r2379, %r2372, 22, 6; | |
mul.wide.u32 %rd956, %r2379, 28; | |
add.s64 %rd957, %rd953, %rd956; | |
ld.global.u32 %r2380, [%rd957]; | |
and.b32 %r2381, %r2380, 65535; | |
shl.b32 %r2382, %r2381, 6; | |
bfe.u32 %r2383, %r2380, 16, 6; | |
or.b32 %r3821, %r2382, %r2383; | |
st.local.u32 [%rd1+460], %r3821; | |
setp.le.u32 %p111, %r690, %r3821; | |
mov.u32 %r3820, %r690; | |
@%p111 bra BB0_222; | |
st.local.u32 [%rd1+456], %r3821; | |
st.local.u32 [%rd1+460], %r690; | |
mov.u32 %r3682, %r3821; | |
mov.u32 %r3821, %r690; | |
mov.u32 %r3820, %r3682; | |
BB0_222: | |
mov.u32 %r693, %r3820; | |
mov.u32 %r692, %r3821; | |
setp.le.u32 %p112, %r3814, %r693; | |
mov.u32 %r3816, %r693; | |
mov.u32 %r3817, %r692; | |
@%p112 bra BB0_224; | |
st.local.u32 [%rd1+448], %r693; | |
st.local.u32 [%rd1+456], %r3814; | |
st.local.u32 [%rd1+452], %r692; | |
st.local.u32 [%rd1+460], %r3815; | |
mov.u32 %r3679, %r3815; | |
mov.u32 %r3681, %r3814; | |
mov.u32 %r3815, %r692; | |
mov.u32 %r3814, %r693; | |
mov.u32 %r3816, %r3681; | |
mov.u32 %r3817, %r3679; | |
BB0_224: | |
mov.u32 %r3806, %r3814; | |
mov.u32 %r3807, %r3815; | |
mov.u32 %r3808, %r3816; | |
mov.u32 %r3809, %r3817; | |
mul.lo.s64 %rd958, %rd56, 1792; | |
add.s64 %rd959, %rd3, %rd958; | |
bfe.u32 %r2384, %r684, 22, 6; | |
mul.wide.u32 %rd960, %r2384, 28; | |
add.s64 %rd961, %rd959, %rd960; | |
ld.global.u32 %r698, [%rd961+-8]; | |
and.b32 %r2385, %r698, 65535; | |
cvt.u64.u32 %rd58, %r2385; | |
bfe.u32 %r2386, %r698, 16, 6; | |
mul.wide.u32 %rd962, %r2385, 1792; | |
add.s64 %rd963, %rd136, %rd962; | |
mul.wide.u32 %rd964, %r2386, 28; | |
add.s64 %rd965, %rd963, %rd964; | |
ld.global.u32 %r2387, [%rd965]; | |
and.b32 %r2388, %r2387, 65535; | |
bfe.u32 %r2389, %r2387, 16, 6; | |
mul.wide.u32 %rd966, %r2388, 1792; | |
add.s64 %rd967, %rd135, %rd966; | |
mul.wide.u32 %rd968, %r2389, 28; | |
add.s64 %rd969, %rd967, %rd968; | |
ld.global.u32 %r2390, [%rd969]; | |
and.b32 %r2391, %r2390, 65535; | |
shl.b32 %r2392, %r2391, 6; | |
bfe.u32 %r2393, %r2390, 16, 6; | |
or.b32 %r699, %r2392, %r2393; | |
st.local.u32 [%rd1+464], %r699; | |
bfe.u32 %r2394, %r2387, 22, 6; | |
mul.wide.u32 %rd970, %r2394, 28; | |
add.s64 %rd971, %rd967, %rd970; | |
ld.global.u32 %r2395, [%rd971]; | |
and.b32 %r2396, %r2395, 65535; | |
shl.b32 %r2397, %r2396, 6; | |
bfe.u32 %r2398, %r2395, 16, 6; | |
or.b32 %r3827, %r2397, %r2398; | |
st.local.u32 [%rd1+468], %r3827; | |
setp.le.u32 %p113, %r699, %r3827; | |
mov.u32 %r3826, %r699; | |
@%p113 bra BB0_226; | |
st.local.u32 [%rd1+464], %r3827; | |
st.local.u32 [%rd1+468], %r699; | |
mov.u32 %r3696, %r3827; | |
mov.u32 %r3827, %r699; | |
mov.u32 %r3826, %r3696; | |
BB0_226: | |
mov.u32 %r3822, %r3826; | |
mov.u32 %r3823, %r3827; | |
bfe.u32 %r2399, %r698, 22, 6; | |
mul.lo.s64 %rd972, %rd58, 1792; | |
add.s64 %rd973, %rd136, %rd972; | |
mul.wide.u32 %rd974, %r2399, 28; | |
add.s64 %rd975, %rd973, %rd974; | |
ld.global.u32 %r2400, [%rd975]; | |
and.b32 %r2401, %r2400, 65535; | |
bfe.u32 %r2402, %r2400, 16, 6; | |
mul.wide.u32 %rd976, %r2401, 1792; | |
add.s64 %rd977, %rd135, %rd976; | |
mul.wide.u32 %rd978, %r2402, 28; | |
add.s64 %rd979, %rd977, %rd978; | |
ld.global.u32 %r2403, [%rd979]; | |
and.b32 %r2404, %r2403, 65535; | |
shl.b32 %r2405, %r2404, 6; | |
bfe.u32 %r2406, %r2403, 16, 6; | |
or.b32 %r703, %r2405, %r2406; | |
st.local.u32 [%rd1+472], %r703; | |
bfe.u32 %r2407, %r2400, 22, 6; | |
mul.wide.u32 %rd980, %r2407, 28; | |
add.s64 %rd981, %rd977, %rd980; | |
ld.global.u32 %r2408, [%rd981]; | |
and.b32 %r2409, %r2408, 65535; | |
shl.b32 %r2410, %r2409, 6; | |
bfe.u32 %r2411, %r2408, 16, 6; | |
or.b32 %r3829, %r2410, %r2411; | |
st.local.u32 [%rd1+476], %r3829; | |
setp.le.u32 %p114, %r703, %r3829; | |
mov.u32 %r3828, %r703; | |
@%p114 bra BB0_228; | |
st.local.u32 [%rd1+472], %r3829; | |
st.local.u32 [%rd1+476], %r703; | |
mov.u32 %r3702, %r3829; | |
mov.u32 %r3829, %r703; | |
mov.u32 %r3828, %r3702; | |
BB0_228: | |
mov.u32 %r706, %r3828; | |
mov.u32 %r705, %r3829; | |
setp.le.u32 %p115, %r3822, %r706; | |
mov.u32 %r3824, %r706; | |
mov.u32 %r3825, %r705; | |
@%p115 bra BB0_230; | |
st.local.u32 [%rd1+464], %r706; | |
st.local.u32 [%rd1+472], %r3822; | |
st.local.u32 [%rd1+468], %r705; | |
st.local.u32 [%rd1+476], %r3823; | |
mov.u32 %r3699, %r3823; | |
mov.u32 %r3701, %r3822; | |
mov.u32 %r3823, %r705; | |
mov.u32 %r3822, %r706; | |
mov.u32 %r3824, %r3701; | |
mov.u32 %r3825, %r3699; | |
BB0_230: | |
mov.u32 %r710, %r3822; | |
mov.u32 %r709, %r3823; | |
mov.u32 %r708, %r3824; | |
mov.u32 %r707, %r3825; | |
setp.le.u32 %p116, %r3806, %r710; | |
mov.u32 %r3810, %r710; | |
mov.u32 %r3811, %r709; | |
mov.u32 %r3812, %r708; | |
mov.u32 %r3813, %r707; | |
@%p116 bra BB0_232; | |
st.local.u32 [%rd1+448], %r710; | |
st.local.u32 [%rd1+464], %r3806; | |
st.local.u32 [%rd1+452], %r709; | |
st.local.u32 [%rd1+468], %r3807; | |
st.local.u32 [%rd1+456], %r708; | |
st.local.u32 [%rd1+472], %r3808; | |
st.local.u32 [%rd1+460], %r707; | |
st.local.u32 [%rd1+476], %r3809; | |
mov.u32 %r3689, %r3809; | |
mov.u32 %r3691, %r3808; | |
mov.u32 %r3693, %r3807; | |
mov.u32 %r3695, %r3806; | |
mov.u32 %r3809, %r707; | |
mov.u32 %r3808, %r708; | |
mov.u32 %r3807, %r709; | |
mov.u32 %r3806, %r710; | |
mov.u32 %r3810, %r3695; | |
mov.u32 %r3811, %r3693; | |
mov.u32 %r3812, %r3691; | |
mov.u32 %r3813, %r3689; | |
BB0_232: | |
mov.u32 %r3790, %r3806; | |
mov.u32 %r3791, %r3807; | |
mov.u32 %r3792, %r3808; | |
mov.u32 %r3793, %r3809; | |
mov.u32 %r3794, %r3810; | |
mov.u32 %r3795, %r3811; | |
mov.u32 %r3796, %r3812; | |
mov.u32 %r3797, %r3813; | |
mul.lo.s64 %rd982, %rd55, 1792; | |
add.s64 %rd983, %rd136, %rd982; | |
bfe.u32 %r2412, %r683, 22, 6; | |
mul.wide.u32 %rd984, %r2412, 28; | |
add.s64 %rd985, %rd983, %rd984; | |
ld.global.u32 %r719, [%rd985+4]; | |
and.b32 %r2413, %r719, 65535; | |
mul.wide.u32 %rd986, %r2413, 1792; | |
add.s64 %rd987, %rd3, %rd986; | |
cvt.u64.u32 %rd59, %r2413; | |
bfe.u32 %r2414, %r719, 16, 6; | |
mul.wide.u32 %rd988, %r2414, 28; | |
add.s64 %rd989, %rd987, %rd988; | |
ld.global.u32 %r720, [%rd989+-8]; | |
and.b32 %r2415, %r720, 65535; | |
cvt.u64.u32 %rd60, %r2415; | |
bfe.u32 %r2416, %r720, 16, 6; | |
mul.wide.u32 %rd990, %r2415, 1792; | |
add.s64 %rd991, %rd136, %rd990; | |
mul.wide.u32 %rd992, %r2416, 28; | |
add.s64 %rd993, %rd991, %rd992; | |
ld.global.u32 %r2417, [%rd993]; | |
and.b32 %r2418, %r2417, 65535; | |
bfe.u32 %r2419, %r2417, 16, 6; | |
mul.wide.u32 %rd994, %r2418, 1792; | |
add.s64 %rd995, %rd135, %rd994; | |
mul.wide.u32 %rd996, %r2419, 28; | |
add.s64 %rd997, %rd995, %rd996; | |
ld.global.u32 %r2420, [%rd997]; | |
and.b32 %r2421, %r2420, 65535; | |
shl.b32 %r2422, %r2421, 6; | |
bfe.u32 %r2423, %r2420, 16, 6; | |
or.b32 %r721, %r2422, %r2423; | |
st.local.u32 [%rd1+480], %r721; | |
bfe.u32 %r2424, %r2417, 22, 6; | |
mul.wide.u32 %rd998, %r2424, 28; | |
add.s64 %rd999, %rd995, %rd998; | |
ld.global.u32 %r2425, [%rd999]; | |
and.b32 %r2426, %r2425, 65535; | |
shl.b32 %r2427, %r2426, 6; | |
bfe.u32 %r2428, %r2425, 16, 6; | |
or.b32 %r3843, %r2427, %r2428; | |
st.local.u32 [%rd1+484], %r3843; | |
setp.le.u32 %p117, %r721, %r3843; | |
mov.u32 %r3842, %r721; | |
@%p117 bra BB0_234; | |
st.local.u32 [%rd1+480], %r3843; | |
st.local.u32 [%rd1+484], %r721; | |
mov.u32 %r3732, %r3843; | |
mov.u32 %r3843, %r721; | |
mov.u32 %r3842, %r3732; | |
BB0_234: | |
mov.u32 %r3838, %r3842; | |
mov.u32 %r3839, %r3843; | |
bfe.u32 %r2429, %r720, 22, 6; | |
mul.lo.s64 %rd1000, %rd60, 1792; | |
add.s64 %rd1001, %rd136, %rd1000; | |
mul.wide.u32 %rd1002, %r2429, 28; | |
add.s64 %rd1003, %rd1001, %rd1002; | |
ld.global.u32 %r2430, [%rd1003]; | |
and.b32 %r2431, %r2430, 65535; | |
bfe.u32 %r2432, %r2430, 16, 6; | |
mul.wide.u32 %rd1004, %r2431, 1792; | |
add.s64 %rd1005, %rd135, %rd1004; | |
mul.wide.u32 %rd1006, %r2432, 28; | |
add.s64 %rd1007, %rd1005, %rd1006; | |
ld.global.u32 %r2433, [%rd1007]; | |
and.b32 %r2434, %r2433, 65535; | |
shl.b32 %r2435, %r2434, 6; | |
bfe.u32 %r2436, %r2433, 16, 6; | |
or.b32 %r725, %r2435, %r2436; | |
st.local.u32 [%rd1+488], %r725; | |
bfe.u32 %r2437, %r2430, 22, 6; | |
mul.wide.u32 %rd1008, %r2437, 28; | |
add.s64 %rd1009, %rd1005, %rd1008; | |
ld.global.u32 %r2438, [%rd1009]; | |
and.b32 %r2439, %r2438, 65535; | |
shl.b32 %r2440, %r2439, 6; | |
bfe.u32 %r2441, %r2438, 16, 6; | |
or.b32 %r3845, %r2440, %r2441; | |
st.local.u32 [%rd1+492], %r3845; | |
setp.le.u32 %p118, %r725, %r3845; | |
mov.u32 %r3844, %r725; | |
@%p118 bra BB0_236; | |
st.local.u32 [%rd1+488], %r3845; | |
st.local.u32 [%rd1+492], %r725; | |
mov.u32 %r3738, %r3845; | |
mov.u32 %r3845, %r725; | |
mov.u32 %r3844, %r3738; | |
BB0_236: | |
mov.u32 %r728, %r3844; | |
mov.u32 %r727, %r3845; | |
setp.le.u32 %p119, %r3838, %r728; | |
mov.u32 %r3840, %r728; | |
mov.u32 %r3841, %r727; | |
@%p119 bra BB0_238; | |
st.local.u32 [%rd1+480], %r728; | |
st.local.u32 [%rd1+488], %r3838; | |
st.local.u32 [%rd1+484], %r727; | |
st.local.u32 [%rd1+492], %r3839; | |
mov.u32 %r3735, %r3839; | |
mov.u32 %r3737, %r3838; | |
mov.u32 %r3839, %r727; | |
mov.u32 %r3838, %r728; | |
mov.u32 %r3840, %r3737; | |
mov.u32 %r3841, %r3735; | |
BB0_238: | |
mov.u32 %r3830, %r3838; | |
mov.u32 %r3831, %r3839; | |
mov.u32 %r3832, %r3840; | |
mov.u32 %r3833, %r3841; | |
mul.lo.s64 %rd1010, %rd59, 1792; | |
add.s64 %rd1011, %rd3, %rd1010; | |
bfe.u32 %r2442, %r719, 22, 6; | |
mul.wide.u32 %rd1012, %r2442, 28; | |
add.s64 %rd1013, %rd1011, %rd1012; | |
ld.global.u32 %r733, [%rd1013+-8]; | |
and.b32 %r2443, %r733, 65535; | |
cvt.u64.u32 %rd61, %r2443; | |
bfe.u32 %r2444, %r733, 16, 6; | |
mul.wide.u32 %rd1014, %r2443, 1792; | |
add.s64 %rd1015, %rd136, %rd1014; | |
mul.wide.u32 %rd1016, %r2444, 28; | |
add.s64 %rd1017, %rd1015, %rd1016; | |
ld.global.u32 %r2445, [%rd1017]; | |
and.b32 %r2446, %r2445, 65535; | |
bfe.u32 %r2447, %r2445, 16, 6; | |
mul.wide.u32 %rd1018, %r2446, 1792; | |
add.s64 %rd1019, %rd135, %rd1018; | |
mul.wide.u32 %rd1020, %r2447, 28; | |
add.s64 %rd1021, %rd1019, %rd1020; | |
ld.global.u32 %r2448, [%rd1021]; | |
and.b32 %r2449, %r2448, 65535; | |
shl.b32 %r2450, %r2449, 6; | |
bfe.u32 %r2451, %r2448, 16, 6; | |
or.b32 %r734, %r2450, %r2451; | |
st.local.u32 [%rd1+496], %r734; | |
bfe.u32 %r2452, %r2445, 22, 6; | |
mul.wide.u32 %rd1022, %r2452, 28; | |
add.s64 %rd1023, %rd1019, %rd1022; | |
ld.global.u32 %r2453, [%rd1023]; | |
and.b32 %r2454, %r2453, 65535; | |
shl.b32 %r2455, %r2454, 6; | |
bfe.u32 %r2456, %r2453, 16, 6; | |
or.b32 %r3851, %r2455, %r2456; | |
st.local.u32 [%rd1+500], %r3851; | |
setp.le.u32 %p120, %r734, %r3851; | |
mov.u32 %r3850, %r734; | |
@%p120 bra BB0_240; | |
st.local.u32 [%rd1+496], %r3851; | |
st.local.u32 [%rd1+500], %r734; | |
mov.u32 %r3752, %r3851; | |
mov.u32 %r3851, %r734; | |
mov.u32 %r3850, %r3752; | |
BB0_240: | |
mov.u32 %r3846, %r3850; | |
mov.u32 %r3847, %r3851; | |
bfe.u32 %r2457, %r733, 22, 6; | |
mul.lo.s64 %rd1024, %rd61, 1792; | |
add.s64 %rd1025, %rd136, %rd1024; | |
mul.wide.u32 %rd1026, %r2457, 28; | |
add.s64 %rd1027, %rd1025, %rd1026; | |
ld.global.u32 %r2458, [%rd1027]; | |
and.b32 %r2459, %r2458, 65535; | |
bfe.u32 %r2460, %r2458, 16, 6; | |
mul.wide.u32 %rd1028, %r2459, 1792; | |
add.s64 %rd1029, %rd135, %rd1028; | |
mul.wide.u32 %rd1030, %r2460, 28; | |
add.s64 %rd1031, %rd1029, %rd1030; | |
ld.global.u32 %r2461, [%rd1031]; | |
and.b32 %r2462, %r2461, 65535; | |
shl.b32 %r2463, %r2462, 6; | |
bfe.u32 %r2464, %r2461, 16, 6; | |
or.b32 %r738, %r2463, %r2464; | |
st.local.u32 [%rd1+504], %r738; | |
bfe.u32 %r2465, %r2458, 22, 6; | |
mul.wide.u32 %rd1032, %r2465, 28; | |
add.s64 %rd1033, %rd1029, %rd1032; | |
ld.global.u32 %r2466, [%rd1033]; | |
and.b32 %r2467, %r2466, 65535; | |
shl.b32 %r2468, %r2467, 6; | |
bfe.u32 %r2469, %r2466, 16, 6; | |
or.b32 %r3853, %r2468, %r2469; | |
st.local.u32 [%rd1+508], %r3853; | |
setp.le.u32 %p121, %r738, %r3853; | |
mov.u32 %r3852, %r738; | |
@%p121 bra BB0_242; | |
st.local.u32 [%rd1+504], %r3853; | |
st.local.u32 [%rd1+508], %r738; | |
mov.u32 %r3758, %r3853; | |
mov.u32 %r3853, %r738; | |
mov.u32 %r3852, %r3758; | |
BB0_242: | |
mov.u32 %r741, %r3852; | |
mov.u32 %r740, %r3853; | |
setp.le.u32 %p122, %r3846, %r741; | |
mov.u32 %r3848, %r741; | |
mov.u32 %r3849, %r740; | |
@%p122 bra BB0_244; | |
st.local.u32 [%rd1+496], %r741; | |
st.local.u32 [%rd1+504], %r3846; | |
st.local.u32 [%rd1+500], %r740; | |
st.local.u32 [%rd1+508], %r3847; | |
mov.u32 %r3755, %r3847; | |
mov.u32 %r3757, %r3846; | |
mov.u32 %r3847, %r740; | |
mov.u32 %r3846, %r741; | |
mov.u32 %r3848, %r3757; | |
mov.u32 %r3849, %r3755; | |
BB0_244: | |
mov.u32 %r745, %r3846; | |
mov.u32 %r744, %r3847; | |
mov.u32 %r743, %r3848; | |
mov.u32 %r742, %r3849; | |
setp.le.u32 %p123, %r3830, %r745; | |
mov.u32 %r3834, %r745; | |
mov.u32 %r3835, %r744; | |
mov.u32 %r3836, %r743; | |
mov.u32 %r3837, %r742; | |
@%p123 bra BB0_246; | |
st.local.u32 [%rd1+480], %r745; | |
st.local.u32 [%rd1+496], %r3830; | |
st.local.u32 [%rd1+484], %r744; | |
st.local.u32 [%rd1+500], %r3831; | |
st.local.u32 [%rd1+488], %r743; | |
st.local.u32 [%rd1+504], %r3832; | |
st.local.u32 [%rd1+492], %r742; | |
st.local.u32 [%rd1+508], %r3833; | |
mov.u32 %r3745, %r3833; | |
mov.u32 %r3747, %r3832; | |
mov.u32 %r3749, %r3831; | |
mov.u32 %r3751, %r3830; | |
mov.u32 %r3833, %r742; | |
mov.u32 %r3832, %r743; | |
mov.u32 %r3831, %r744; | |
mov.u32 %r3830, %r745; | |
mov.u32 %r3834, %r3751; | |
mov.u32 %r3835, %r3749; | |
mov.u32 %r3836, %r3747; | |
mov.u32 %r3837, %r3745; | |
BB0_246: | |
mov.u32 %r753, %r3830; | |
mov.u32 %r752, %r3831; | |
mov.u32 %r751, %r3832; | |
mov.u32 %r750, %r3833; | |
mov.u32 %r749, %r3834; | |
mov.u32 %r748, %r3835; | |
mov.u32 %r747, %r3836; | |
mov.u32 %r746, %r3837; | |
setp.le.u32 %p124, %r3790, %r753; | |
mov.u32 %r3798, %r753; | |
mov.u32 %r3799, %r752; | |
mov.u32 %r3800, %r751; | |
mov.u32 %r3801, %r750; | |
mov.u32 %r3802, %r749; | |
mov.u32 %r3803, %r748; | |
mov.u32 %r3804, %r747; | |
mov.u32 %r3805, %r746; | |
@%p124 bra BB0_248; | |
st.local.u32 [%rd1+448], %r753; | |
st.local.u32 [%rd1+480], %r3790; | |
st.local.u32 [%rd1+452], %r752; | |
st.local.u32 [%rd1+484], %r3791; | |
st.local.u32 [%rd1+456], %r751; | |
st.local.u32 [%rd1+488], %r3792; | |
st.local.u32 [%rd1+460], %r750; | |
st.local.u32 [%rd1+492], %r3793; | |
st.local.u32 [%rd1+464], %r749; | |
st.local.u32 [%rd1+496], %r3794; | |
st.local.u32 [%rd1+468], %r748; | |
st.local.u32 [%rd1+500], %r3795; | |
st.local.u32 [%rd1+472], %r747; | |
st.local.u32 [%rd1+504], %r3796; | |
st.local.u32 [%rd1+476], %r746; | |
st.local.u32 [%rd1+508], %r3797; | |
mov.u32 %r3717, %r3797; | |
mov.u32 %r3719, %r3796; | |
mov.u32 %r3721, %r3795; | |
mov.u32 %r3723, %r3794; | |
mov.u32 %r3725, %r3793; | |
mov.u32 %r3727, %r3792; | |
mov.u32 %r3729, %r3791; | |
mov.u32 %r3731, %r3790; | |
mov.u32 %r3797, %r746; | |
mov.u32 %r3796, %r747; | |
mov.u32 %r3795, %r748; | |
mov.u32 %r3794, %r749; | |
mov.u32 %r3793, %r750; | |
mov.u32 %r3792, %r751; | |
mov.u32 %r3791, %r752; | |
mov.u32 %r3790, %r753; | |
mov.u32 %r3798, %r3731; | |
mov.u32 %r3799, %r3729; | |
mov.u32 %r3800, %r3727; | |
mov.u32 %r3801, %r3725; | |
mov.u32 %r3802, %r3723; | |
mov.u32 %r3803, %r3721; | |
mov.u32 %r3804, %r3719; | |
mov.u32 %r3805, %r3717; | |
BB0_248: | |
mov.u32 %r769, %r3790; | |
setp.le.u32 %p125, %r682, %r769; | |
mov.u32 %r3789, %r682; | |
@%p125 bra BB0_250; | |
st.local.u32 [%rd1+384], %r769; | |
st.local.u32 [%rd1+448], %r682; | |
st.local.u32 [%rd1+388], %r3791; | |
st.local.u32 [%rd1+452], %r3855; | |
st.local.u32 [%rd1+392], %r3792; | |
st.local.u32 [%rd1+456], %r3856; | |
st.local.u32 [%rd1+396], %r3793; | |
st.local.u32 [%rd1+460], %r3857; | |
st.local.u32 [%rd1+400], %r3794; | |
st.local.u32 [%rd1+464], %r3858; | |
st.local.u32 [%rd1+404], %r3795; | |
st.local.u32 [%rd1+468], %r3859; | |
st.local.u32 [%rd1+408], %r3796; | |
st.local.u32 [%rd1+472], %r3860; | |
st.local.u32 [%rd1+412], %r3797; | |
st.local.u32 [%rd1+476], %r3861; | |
st.local.u32 [%rd1+416], %r3798; | |
st.local.u32 [%rd1+480], %r3862; | |
st.local.u32 [%rd1+420], %r3799; | |
st.local.u32 [%rd1+484], %r3863; | |
st.local.u32 [%rd1+424], %r3800; | |
st.local.u32 [%rd1+488], %r3864; | |
st.local.u32 [%rd1+428], %r3801; | |
st.local.u32 [%rd1+492], %r3865; | |
st.local.u32 [%rd1+432], %r3802; | |
st.local.u32 [%rd1+496], %r3866; | |
st.local.u32 [%rd1+436], %r3803; | |
st.local.u32 [%rd1+500], %r3867; | |
st.local.u32 [%rd1+440], %r3804; | |
st.local.u32 [%rd1+504], %r3868; | |
st.local.u32 [%rd1+444], %r3805; | |
st.local.u32 [%rd1+508], %r3869; | |
mov.u32 %r3789, %r769; | |
BB0_250: | |
mov.u32 %r3918, 0; | |
setp.le.u32 %p126, %r4146, %r3789; | |
@%p126 bra BB0_253; | |
BB0_251: | |
mul.wide.u32 %rd1034, %r3918, 4; | |
add.s64 %rd1035, %rd1, %rd1034; | |
ld.local.u32 %r2471, [%rd1035+256]; | |
ld.local.u32 %r2472, [%rd1035+384]; | |
ld.local.u32 %r2473, [%rd1035+260]; | |
ld.local.u32 %r2474, [%rd1035+388]; | |
ld.local.u32 %r2475, [%rd1035+264]; | |
ld.local.u32 %r2476, [%rd1035+392]; | |
ld.local.u32 %r2477, [%rd1035+268]; | |
ld.local.u32 %r2478, [%rd1035+396]; | |
ld.local.u32 %r2479, [%rd1035+272]; | |
ld.local.u32 %r2480, [%rd1035+400]; | |
ld.local.u32 %r2481, [%rd1035+276]; | |
ld.local.u32 %r2482, [%rd1035+404]; | |
ld.local.u32 %r2483, [%rd1035+280]; | |
ld.local.u32 %r2484, [%rd1035+408]; | |
ld.local.u32 %r2485, [%rd1035+284]; | |
ld.local.u32 %r2486, [%rd1035+412]; | |
st.local.u32 [%rd1035+256], %r2472; | |
st.local.u32 [%rd1035+384], %r2471; | |
st.local.u32 [%rd1035+260], %r2474; | |
st.local.u32 [%rd1035+388], %r2473; | |
st.local.u32 [%rd1035+264], %r2476; | |
st.local.u32 [%rd1035+392], %r2475; | |
st.local.u32 [%rd1035+268], %r2478; | |
st.local.u32 [%rd1035+396], %r2477; | |
st.local.u32 [%rd1035+272], %r2480; | |
st.local.u32 [%rd1035+400], %r2479; | |
st.local.u32 [%rd1035+276], %r2482; | |
st.local.u32 [%rd1035+404], %r2481; | |
st.local.u32 [%rd1035+280], %r2484; | |
st.local.u32 [%rd1035+408], %r2483; | |
st.local.u32 [%rd1035+284], %r2486; | |
st.local.u32 [%rd1035+412], %r2485; | |
add.s32 %r3918, %r3918, 8; | |
setp.ne.s32 %p127, %r3918, 32; | |
@%p127 bra BB0_251; | |
ld.local.u32 %r4857, [%rd1]; | |
ld.local.u32 %r4146, [%rd1+256]; | |
BB0_253: | |
mov.u32 %r4856, %r4857; | |
mov.u32 %r5179, 0; | |
setp.le.u32 %p128, %r4856, %r4146; | |
@%p128 bra BB0_256; | |
bra.uni BB0_254; | |
BB0_255: | |
ld.local.u32 %r4856, [%rd62+64]; | |
BB0_254: | |
mov.u32 %r777, %r4856; | |
mul.wide.u32 %rd1036, %r5179, 4; | |
add.s64 %rd62, %rd1, %rd1036; | |
ld.local.u32 %r2488, [%rd62+256]; | |
ld.local.u32 %r2489, [%rd62+4]; | |
ld.local.u32 %r2490, [%rd62+260]; | |
ld.local.u32 %r2491, [%rd62+8]; | |
ld.local.u32 %r2492, [%rd62+264]; | |
ld.local.u32 %r2493, [%rd62+12]; | |
ld.local.u32 %r2494, [%rd62+268]; | |
ld.local.u32 %r2495, [%rd62+16]; | |
ld.local.u32 %r2496, [%rd62+272]; | |
ld.local.u32 %r2497, [%rd62+20]; | |
ld.local.u32 %r2498, [%rd62+276]; | |
ld.local.u32 %r2499, [%rd62+24]; | |
ld.local.u32 %r2500, [%rd62+280]; | |
ld.local.u32 %r2501, [%rd62+28]; | |
ld.local.u32 %r2502, [%rd62+284]; | |
ld.local.u32 %r2503, [%rd62+32]; | |
ld.local.u32 %r2504, [%rd62+288]; | |
ld.local.u32 %r2505, [%rd62+36]; | |
ld.local.u32 %r2506, [%rd62+292]; | |
ld.local.u32 %r2507, [%rd62+40]; | |
ld.local.u32 %r2508, [%rd62+296]; | |
ld.local.u32 %r2509, [%rd62+44]; | |
ld.local.u32 %r2510, [%rd62+300]; | |
ld.local.u32 %r2511, [%rd62+48]; | |
ld.local.u32 %r2512, [%rd62+304]; | |
ld.local.u32 %r2513, [%rd62+52]; | |
ld.local.u32 %r2514, [%rd62+308]; | |
st.local.u32 [%rd62], %r2488; | |
st.local.u32 [%rd62+256], %r777; | |
st.local.u32 [%rd62+4], %r2490; | |
st.local.u32 [%rd62+260], %r2489; | |
st.local.u32 [%rd62+8], %r2492; | |
st.local.u32 [%rd62+264], %r2491; | |
st.local.u32 [%rd62+12], %r2494; | |
st.local.u32 [%rd62+268], %r2493; | |
st.local.u32 [%rd62+16], %r2496; | |
st.local.u32 [%rd62+272], %r2495; | |
st.local.u32 [%rd62+20], %r2498; | |
st.local.u32 [%rd62+276], %r2497; | |
st.local.u32 [%rd62+24], %r2500; | |
st.local.u32 [%rd62+280], %r2499; | |
st.local.u32 [%rd62+28], %r2502; | |
st.local.u32 [%rd62+284], %r2501; | |
st.local.u32 [%rd62+32], %r2504; | |
st.local.u32 [%rd62+288], %r2503; | |
st.local.u32 [%rd62+36], %r2506; | |
st.local.u32 [%rd62+292], %r2505; | |
st.local.u32 [%rd62+40], %r2508; | |
st.local.u32 [%rd62+296], %r2507; | |
st.local.u32 [%rd62+44], %r2510; | |
st.local.u32 [%rd62+300], %r2509; | |
st.local.u32 [%rd62+48], %r2512; | |
st.local.u32 [%rd62+304], %r2511; | |
st.local.u32 [%rd62+52], %r2514; | |
st.local.u32 [%rd62+308], %r2513; | |
ld.local.u32 %r2515, [%rd62+56]; | |
ld.local.u32 %r2516, [%rd62+312]; | |
ld.local.u32 %r2517, [%rd62+60]; | |
ld.local.u32 %r2518, [%rd62+316]; | |
st.local.u32 [%rd62+56], %r2516; | |
st.local.u32 [%rd62+312], %r2515; | |
st.local.u32 [%rd62+60], %r2518; | |
st.local.u32 [%rd62+316], %r2517; | |
add.s32 %r5179, %r5179, 16; | |
setp.eq.s32 %p129, %r5179, 64; | |
@%p129 bra BB0_256; | |
bra.uni BB0_255; | |
BB0_256: | |
ld.param.u32 %r3562, [local_listindices8_param_2]; | |
bfe.u32 %r2519, %r3562, 22, 6; | |
mul.wide.u32 %rd1040, %r2519, 28; | |
add.s64 %rd1041, %rd139, %rd1040; | |
ld.global.u32 %r781, [%rd1041+12]; | |
and.b32 %r2521, %r781, 65535; | |
bfe.u32 %r2522, %r781, 16, 6; | |
mul.wide.u32 %rd1042, %r2521, 1792; | |
add.s64 %rd1043, %rd3, %rd1042; | |
mul.wide.u32 %rd1044, %r2522, 28; | |
add.s64 %rd1045, %rd1043, %rd1044; | |
ld.global.u32 %r782, [%rd1045]; | |
and.b32 %r2523, %r782, 65535; | |
mul.wide.u32 %rd1046, %r2523, 1792; | |
add.s64 %rd1047, %rd146, %rd1046; | |
bfe.u32 %r2524, %r782, 16, 6; | |
mul.wide.u32 %rd1048, %r2524, 28; | |
add.s64 %rd1049, %rd1047, %rd1048; | |
ld.global.u32 %r783, [%rd1049+4]; | |
and.b32 %r2525, %r783, 65535; | |
mul.wide.u32 %rd1050, %r2525, 1792; | |
add.s64 %rd1051, %rd3, %rd1050; | |
bfe.u32 %r2526, %r783, 16, 6; | |
mul.wide.u32 %rd1052, %r2526, 28; | |
add.s64 %rd1053, %rd1051, %rd1052; | |
ld.global.u32 %r784, [%rd1053+-4]; | |
and.b32 %r2527, %r784, 65535; | |
bfe.u32 %r2528, %r784, 16, 6; | |
mul.wide.u32 %rd1054, %r2527, 1792; | |
add.s64 %rd1055, %rd146, %rd1054; | |
mul.wide.u32 %rd1056, %r2528, 28; | |
add.s64 %rd1057, %rd1055, %rd1056; | |
ld.global.u32 %r785, [%rd1057]; | |
and.b32 %r2529, %r785, 65535; | |
mul.wide.u32 %rd1058, %r2529, 1792; | |
add.s64 %rd1059, %rd3, %rd1058; | |
cvt.u64.u32 %rd63, %r2521; | |
cvt.u64.u32 %rd64, %r2523; | |
cvt.u64.u32 %rd65, %r2525; | |
cvt.u64.u32 %rd66, %r2527; | |
cvt.u64.u32 %rd67, %r2529; | |
bfe.u32 %r2530, %r785, 16, 6; | |
mul.wide.u32 %rd1060, %r2530, 28; | |
add.s64 %rd1061, %rd1059, %rd1060; | |
ld.global.u32 %r786, [%rd1061+-8]; | |
and.b32 %r2531, %r786, 65535; | |
cvt.u64.u32 %rd68, %r2531; | |
bfe.u32 %r2532, %r786, 16, 6; | |
mul.wide.u32 %rd1062, %r2531, 1792; | |
add.s64 %rd1063, %rd136, %rd1062; | |
mul.wide.u32 %rd1064, %r2532, 28; | |
add.s64 %rd1065, %rd1063, %rd1064; | |
ld.global.u32 %r2533, [%rd1065]; | |
and.b32 %r2534, %r2533, 65535; | |
bfe.u32 %r2535, %r2533, 16, 6; | |
mul.wide.u32 %rd1066, %r2534, 1792; | |
add.s64 %rd1067, %rd135, %rd1066; | |
mul.wide.u32 %rd1068, %r2535, 28; | |
add.s64 %rd1069, %rd1067, %rd1068; | |
ld.global.u32 %r2536, [%rd1069]; | |
and.b32 %r2537, %r2536, 65535; | |
shl.b32 %r2538, %r2537, 6; | |
bfe.u32 %r2539, %r2536, 16, 6; | |
or.b32 %r787, %r2538, %r2539; | |
st.local.u32 [%rd1+512], %r787; | |
bfe.u32 %r2540, %r2533, 22, 6; | |
mul.wide.u32 %rd1070, %r2540, 28; | |
add.s64 %rd1071, %rd1067, %rd1070; | |
ld.global.u32 %r2541, [%rd1071]; | |
and.b32 %r2542, %r2541, 65535; | |
shl.b32 %r2543, %r2542, 6; | |
bfe.u32 %r2544, %r2541, 16, 6; | |
or.b32 %r5500, %r2543, %r2544; | |
st.local.u32 [%rd1+516], %r5500; | |
setp.le.u32 %p130, %r787, %r5500; | |
mov.u32 %r5499, %r787; | |
@%p130 bra BB0_258; | |
st.local.u32 [%rd1+512], %r5500; | |
st.local.u32 [%rd1+516], %r787; | |
mov.u32 %r5180, %r5500; | |
mov.u32 %r5500, %r787; | |
mov.u32 %r5499, %r5180; | |
BB0_258: | |
mov.u32 %r5495, %r5499; | |
mov.u32 %r5496, %r5500; | |
bfe.u32 %r2545, %r786, 22, 6; | |
mul.lo.s64 %rd1072, %rd68, 1792; | |
add.s64 %rd1073, %rd136, %rd1072; | |
mul.wide.u32 %rd1074, %r2545, 28; | |
add.s64 %rd1075, %rd1073, %rd1074; | |
ld.global.u32 %r2546, [%rd1075]; | |
and.b32 %r2547, %r2546, 65535; | |
bfe.u32 %r2548, %r2546, 16, 6; | |
mul.wide.u32 %rd1076, %r2547, 1792; | |
add.s64 %rd1077, %rd135, %rd1076; | |
mul.wide.u32 %rd1078, %r2548, 28; | |
add.s64 %rd1079, %rd1077, %rd1078; | |
ld.global.u32 %r2549, [%rd1079]; | |
and.b32 %r2550, %r2549, 65535; | |
shl.b32 %r2551, %r2550, 6; | |
bfe.u32 %r2552, %r2549, 16, 6; | |
or.b32 %r791, %r2551, %r2552; | |
st.local.u32 [%rd1+520], %r791; | |
bfe.u32 %r2553, %r2546, 22, 6; | |
mul.wide.u32 %rd1080, %r2553, 28; | |
add.s64 %rd1081, %rd1077, %rd1080; | |
ld.global.u32 %r2554, [%rd1081]; | |
and.b32 %r2555, %r2554, 65535; | |
shl.b32 %r2556, %r2555, 6; | |
bfe.u32 %r2557, %r2554, 16, 6; | |
or.b32 %r5502, %r2556, %r2557; | |
st.local.u32 [%rd1+524], %r5502; | |
setp.le.u32 %p131, %r791, %r5502; | |
mov.u32 %r5501, %r791; | |
@%p131 bra BB0_260; | |
st.local.u32 [%rd1+520], %r5502; | |
st.local.u32 [%rd1+524], %r791; | |
mov.u32 %r5186, %r5502; | |
mov.u32 %r5502, %r791; | |
mov.u32 %r5501, %r5186; | |
BB0_260: | |
mov.u32 %r794, %r5501; | |
mov.u32 %r793, %r5502; | |
setp.le.u32 %p132, %r5495, %r794; | |
mov.u32 %r5497, %r794; | |
mov.u32 %r5498, %r793; | |
@%p132 bra BB0_262; | |
st.local.u32 [%rd1+512], %r794; | |
st.local.u32 [%rd1+520], %r5495; | |
st.local.u32 [%rd1+516], %r793; | |
st.local.u32 [%rd1+524], %r5496; | |
mov.u32 %r5183, %r5496; | |
mov.u32 %r5185, %r5495; | |
mov.u32 %r5496, %r793; | |
mov.u32 %r5495, %r794; | |
mov.u32 %r5497, %r5185; | |
mov.u32 %r5498, %r5183; | |
BB0_262: | |
mov.u32 %r5487, %r5495; | |
mov.u32 %r5488, %r5496; | |
mov.u32 %r5489, %r5497; | |
mov.u32 %r5490, %r5498; | |
mul.lo.s64 %rd1082, %rd67, 1792; | |
add.s64 %rd1083, %rd3, %rd1082; | |
bfe.u32 %r2558, %r785, 22, 6; | |
mul.wide.u32 %rd1084, %r2558, 28; | |
add.s64 %rd1085, %rd1083, %rd1084; | |
ld.global.u32 %r799, [%rd1085+-8]; | |
and.b32 %r2559, %r799, 65535; | |
cvt.u64.u32 %rd69, %r2559; | |
bfe.u32 %r2560, %r799, 16, 6; | |
mul.wide.u32 %rd1086, %r2559, 1792; | |
add.s64 %rd1087, %rd136, %rd1086; | |
mul.wide.u32 %rd1088, %r2560, 28; | |
add.s64 %rd1089, %rd1087, %rd1088; | |
ld.global.u32 %r2561, [%rd1089]; | |
and.b32 %r2562, %r2561, 65535; | |
bfe.u32 %r2563, %r2561, 16, 6; | |
mul.wide.u32 %rd1090, %r2562, 1792; | |
add.s64 %rd1091, %rd135, %rd1090; | |
mul.wide.u32 %rd1092, %r2563, 28; | |
add.s64 %rd1093, %rd1091, %rd1092; | |
ld.global.u32 %r2564, [%rd1093]; | |
and.b32 %r2565, %r2564, 65535; | |
shl.b32 %r2566, %r2565, 6; | |
bfe.u32 %r2567, %r2564, 16, 6; | |
or.b32 %r800, %r2566, %r2567; | |
st.local.u32 [%rd1+528], %r800; | |
bfe.u32 %r2568, %r2561, 22, 6; | |
mul.wide.u32 %rd1094, %r2568, 28; | |
add.s64 %rd1095, %rd1091, %rd1094; | |
ld.global.u32 %r2569, [%rd1095]; | |
and.b32 %r2570, %r2569, 65535; | |
shl.b32 %r2571, %r2570, 6; | |
bfe.u32 %r2572, %r2569, 16, 6; | |
or.b32 %r5508, %r2571, %r2572; | |
st.local.u32 [%rd1+532], %r5508; | |
setp.le.u32 %p133, %r800, %r5508; | |
mov.u32 %r5507, %r800; | |
@%p133 bra BB0_264; | |
st.local.u32 [%rd1+528], %r5508; | |
st.local.u32 [%rd1+532], %r800; | |
mov.u32 %r5200, %r5508; | |
mov.u32 %r5508, %r800; | |
mov.u32 %r5507, %r5200; | |
BB0_264: | |
mov.u32 %r5503, %r5507; | |
mov.u32 %r5504, %r5508; | |
bfe.u32 %r2573, %r799, 22, 6; | |
mul.lo.s64 %rd1096, %rd69, 1792; | |
add.s64 %rd1097, %rd136, %rd1096; | |
mul.wide.u32 %rd1098, %r2573, 28; | |
add.s64 %rd1099, %rd1097, %rd1098; | |
ld.global.u32 %r2574, [%rd1099]; | |
and.b32 %r2575, %r2574, 65535; | |
bfe.u32 %r2576, %r2574, 16, 6; | |
mul.wide.u32 %rd1100, %r2575, 1792; | |
add.s64 %rd1101, %rd135, %rd1100; | |
mul.wide.u32 %rd1102, %r2576, 28; | |
add.s64 %rd1103, %rd1101, %rd1102; | |
ld.global.u32 %r2577, [%rd1103]; | |
and.b32 %r2578, %r2577, 65535; | |
shl.b32 %r2579, %r2578, 6; | |
bfe.u32 %r2580, %r2577, 16, 6; | |
or.b32 %r804, %r2579, %r2580; | |
st.local.u32 [%rd1+536], %r804; | |
bfe.u32 %r2581, %r2574, 22, 6; | |
mul.wide.u32 %rd1104, %r2581, 28; | |
add.s64 %rd1105, %rd1101, %rd1104; | |
ld.global.u32 %r2582, [%rd1105]; | |
and.b32 %r2583, %r2582, 65535; | |
shl.b32 %r2584, %r2583, 6; | |
bfe.u32 %r2585, %r2582, 16, 6; | |
or.b32 %r5510, %r2584, %r2585; | |
st.local.u32 [%rd1+540], %r5510; | |
setp.le.u32 %p134, %r804, %r5510; | |
mov.u32 %r5509, %r804; | |
@%p134 bra BB0_266; | |
st.local.u32 [%rd1+536], %r5510; | |
st.local.u32 [%rd1+540], %r804; | |
mov.u32 %r5206, %r5510; | |
mov.u32 %r5510, %r804; | |
mov.u32 %r5509, %r5206; | |
BB0_266: | |
mov.u32 %r807, %r5509; | |
mov.u32 %r806, %r5510; | |
setp.le.u32 %p135, %r5503, %r807; | |
mov.u32 %r5505, %r807; | |
mov.u32 %r5506, %r806; | |
@%p135 bra BB0_268; | |
st.local.u32 [%rd1+528], %r807; | |
st.local.u32 [%rd1+536], %r5503; | |
st.local.u32 [%rd1+532], %r806; | |
st.local.u32 [%rd1+540], %r5504; | |
mov.u32 %r5203, %r5504; | |
mov.u32 %r5205, %r5503; | |
mov.u32 %r5504, %r806; | |
mov.u32 %r5503, %r807; | |
mov.u32 %r5505, %r5205; | |
mov.u32 %r5506, %r5203; | |
BB0_268: | |
mov.u32 %r811, %r5503; | |
mov.u32 %r810, %r5504; | |
mov.u32 %r809, %r5505; | |
mov.u32 %r808, %r5506; | |
setp.le.u32 %p136, %r5487, %r811; | |
mov.u32 %r5491, %r811; | |
mov.u32 %r5492, %r810; | |
mov.u32 %r5493, %r809; | |
mov.u32 %r5494, %r808; | |
@%p136 bra BB0_270; | |
st.local.u32 [%rd1+512], %r811; | |
st.local.u32 [%rd1+528], %r5487; | |
st.local.u32 [%rd1+516], %r810; | |
st.local.u32 [%rd1+532], %r5488; | |
st.local.u32 [%rd1+520], %r809; | |
st.local.u32 [%rd1+536], %r5489; | |
st.local.u32 [%rd1+524], %r808; | |
st.local.u32 [%rd1+540], %r5490; | |
mov.u32 %r5193, %r5490; | |
mov.u32 %r5195, %r5489; | |
mov.u32 %r5197, %r5488; | |
mov.u32 %r5199, %r5487; | |
mov.u32 %r5490, %r808; | |
mov.u32 %r5489, %r809; | |
mov.u32 %r5488, %r810; | |
mov.u32 %r5487, %r811; | |
mov.u32 %r5491, %r5199; | |
mov.u32 %r5492, %r5197; | |
mov.u32 %r5493, %r5195; | |
mov.u32 %r5494, %r5193; | |
BB0_270: | |
mov.u32 %r5471, %r5487; | |
mov.u32 %r5472, %r5488; | |
mov.u32 %r5473, %r5489; | |
mov.u32 %r5474, %r5490; | |
mov.u32 %r5475, %r5491; | |
mov.u32 %r5476, %r5492; | |
mov.u32 %r5477, %r5493; | |
mov.u32 %r5478, %r5494; | |
mul.lo.s64 %rd1106, %rd66, 1792; | |
add.s64 %rd1107, %rd136, %rd1106; | |
bfe.u32 %r2586, %r784, 22, 6; | |
mul.wide.u32 %rd1108, %r2586, 28; | |
add.s64 %rd1109, %rd1107, %rd1108; | |
ld.global.u32 %r820, [%rd1109+4]; | |
and.b32 %r2587, %r820, 65535; | |
mul.wide.u32 %rd1110, %r2587, 1792; | |
add.s64 %rd1111, %rd3, %rd1110; | |
cvt.u64.u32 %rd70, %r2587; | |
bfe.u32 %r2588, %r820, 16, 6; | |
mul.wide.u32 %rd1112, %r2588, 28; | |
add.s64 %rd1113, %rd1111, %rd1112; | |
ld.global.u32 %r821, [%rd1113+-8]; | |
and.b32 %r2589, %r821, 65535; | |
cvt.u64.u32 %rd71, %r2589; | |
bfe.u32 %r2590, %r821, 16, 6; | |
mul.wide.u32 %rd1114, %r2589, 1792; | |
add.s64 %rd1115, %rd136, %rd1114; | |
mul.wide.u32 %rd1116, %r2590, 28; | |
add.s64 %rd1117, %rd1115, %rd1116; | |
ld.global.u32 %r2591, [%rd1117]; | |
and.b32 %r2592, %r2591, 65535; | |
bfe.u32 %r2593, %r2591, 16, 6; | |
mul.wide.u32 %rd1118, %r2592, 1792; | |
add.s64 %rd1119, %rd135, %rd1118; | |
mul.wide.u32 %rd1120, %r2593, 28; | |
add.s64 %rd1121, %rd1119, %rd1120; | |
ld.global.u32 %r2594, [%rd1121]; | |
and.b32 %r2595, %r2594, 65535; | |
shl.b32 %r2596, %r2595, 6; | |
bfe.u32 %r2597, %r2594, 16, 6; | |
or.b32 %r822, %r2596, %r2597; | |
st.local.u32 [%rd1+544], %r822; | |
bfe.u32 %r2598, %r2591, 22, 6; | |
mul.wide.u32 %rd1122, %r2598, 28; | |
add.s64 %rd1123, %rd1119, %rd1122; | |
ld.global.u32 %r2599, [%rd1123]; | |
and.b32 %r2600, %r2599, 65535; | |
shl.b32 %r2601, %r2600, 6; | |
bfe.u32 %r2602, %r2599, 16, 6; | |
or.b32 %r5524, %r2601, %r2602; | |
st.local.u32 [%rd1+548], %r5524; | |
setp.le.u32 %p137, %r822, %r5524; | |
mov.u32 %r5523, %r822; | |
@%p137 bra BB0_272; | |
st.local.u32 [%rd1+544], %r5524; | |
st.local.u32 [%rd1+548], %r822; | |
mov.u32 %r5236, %r5524; | |
mov.u32 %r5524, %r822; | |
mov.u32 %r5523, %r5236; | |
BB0_272: | |
mov.u32 %r5519, %r5523; | |
mov.u32 %r5520, %r5524; | |
bfe.u32 %r2603, %r821, 22, 6; | |
mul.lo.s64 %rd1124, %rd71, 1792; | |
add.s64 %rd1125, %rd136, %rd1124; | |
mul.wide.u32 %rd1126, %r2603, 28; | |
add.s64 %rd1127, %rd1125, %rd1126; | |
ld.global.u32 %r2604, [%rd1127]; | |
and.b32 %r2605, %r2604, 65535; | |
bfe.u32 %r2606, %r2604, 16, 6; | |
mul.wide.u32 %rd1128, %r2605, 1792; | |
add.s64 %rd1129, %rd135, %rd1128; | |
mul.wide.u32 %rd1130, %r2606, 28; | |
add.s64 %rd1131, %rd1129, %rd1130; | |
ld.global.u32 %r2607, [%rd1131]; | |
and.b32 %r2608, %r2607, 65535; | |
shl.b32 %r2609, %r2608, 6; | |
bfe.u32 %r2610, %r2607, 16, 6; | |
or.b32 %r826, %r2609, %r2610; | |
st.local.u32 [%rd1+552], %r826; | |
bfe.u32 %r2611, %r2604, 22, 6; | |
mul.wide.u32 %rd1132, %r2611, 28; | |
add.s64 %rd1133, %rd1129, %rd1132; | |
ld.global.u32 %r2612, [%rd1133]; | |
and.b32 %r2613, %r2612, 65535; | |
shl.b32 %r2614, %r2613, 6; | |
bfe.u32 %r2615, %r2612, 16, 6; | |
or.b32 %r5526, %r2614, %r2615; | |
st.local.u32 [%rd1+556], %r5526; | |
setp.le.u32 %p138, %r826, %r5526; | |
mov.u32 %r5525, %r826; | |
@%p138 bra BB0_274; | |
st.local.u32 [%rd1+552], %r5526; | |
st.local.u32 [%rd1+556], %r826; | |
mov.u32 %r5242, %r5526; | |
mov.u32 %r5526, %r826; | |
mov.u32 %r5525, %r5242; | |
BB0_274: | |
mov.u32 %r829, %r5525; | |
mov.u32 %r828, %r5526; | |
setp.le.u32 %p139, %r5519, %r829; | |
mov.u32 %r5521, %r829; | |
mov.u32 %r5522, %r828; | |
@%p139 bra BB0_276; | |
st.local.u32 [%rd1+544], %r829; | |
st.local.u32 [%rd1+552], %r5519; | |
st.local.u32 [%rd1+548], %r828; | |
st.local.u32 [%rd1+556], %r5520; | |
mov.u32 %r5239, %r5520; | |
mov.u32 %r5241, %r5519; | |
mov.u32 %r5520, %r828; | |
mov.u32 %r5519, %r829; | |
mov.u32 %r5521, %r5241; | |
mov.u32 %r5522, %r5239; | |
BB0_276: | |
mov.u32 %r5511, %r5519; | |
mov.u32 %r5512, %r5520; | |
mov.u32 %r5513, %r5521; | |
mov.u32 %r5514, %r5522; | |
mul.lo.s64 %rd1134, %rd70, 1792; | |
add.s64 %rd1135, %rd3, %rd1134; | |
bfe.u32 %r2616, %r820, 22, 6; | |
mul.wide.u32 %rd1136, %r2616, 28; | |
add.s64 %rd1137, %rd1135, %rd1136; | |
ld.global.u32 %r834, [%rd1137+-8]; | |
and.b32 %r2617, %r834, 65535; | |
cvt.u64.u32 %rd72, %r2617; | |
bfe.u32 %r2618, %r834, 16, 6; | |
mul.wide.u32 %rd1138, %r2617, 1792; | |
add.s64 %rd1139, %rd136, %rd1138; | |
mul.wide.u32 %rd1140, %r2618, 28; | |
add.s64 %rd1141, %rd1139, %rd1140; | |
ld.global.u32 %r2619, [%rd1141]; | |
and.b32 %r2620, %r2619, 65535; | |
bfe.u32 %r2621, %r2619, 16, 6; | |
mul.wide.u32 %rd1142, %r2620, 1792; | |
add.s64 %rd1143, %rd135, %rd1142; | |
mul.wide.u32 %rd1144, %r2621, 28; | |
add.s64 %rd1145, %rd1143, %rd1144; | |
ld.global.u32 %r2622, [%rd1145]; | |
and.b32 %r2623, %r2622, 65535; | |
shl.b32 %r2624, %r2623, 6; | |
bfe.u32 %r2625, %r2622, 16, 6; | |
or.b32 %r835, %r2624, %r2625; | |
st.local.u32 [%rd1+560], %r835; | |
bfe.u32 %r2626, %r2619, 22, 6; | |
mul.wide.u32 %rd1146, %r2626, 28; | |
add.s64 %rd1147, %rd1143, %rd1146; | |
ld.global.u32 %r2627, [%rd1147]; | |
and.b32 %r2628, %r2627, 65535; | |
shl.b32 %r2629, %r2628, 6; | |
bfe.u32 %r2630, %r2627, 16, 6; | |
or.b32 %r5532, %r2629, %r2630; | |
st.local.u32 [%rd1+564], %r5532; | |
setp.le.u32 %p140, %r835, %r5532; | |
mov.u32 %r5531, %r835; | |
@%p140 bra BB0_278; | |
st.local.u32 [%rd1+560], %r5532; | |
st.local.u32 [%rd1+564], %r835; | |
mov.u32 %r5256, %r5532; | |
mov.u32 %r5532, %r835; | |
mov.u32 %r5531, %r5256; | |
BB0_278: | |
mov.u32 %r5527, %r5531; | |
mov.u32 %r5528, %r5532; | |
bfe.u32 %r2631, %r834, 22, 6; | |
mul.lo.s64 %rd1148, %rd72, 1792; | |
add.s64 %rd1149, %rd136, %rd1148; | |
mul.wide.u32 %rd1150, %r2631, 28; | |
add.s64 %rd1151, %rd1149, %rd1150; | |
ld.global.u32 %r2632, [%rd1151]; | |
and.b32 %r2633, %r2632, 65535; | |
bfe.u32 %r2634, %r2632, 16, 6; | |
mul.wide.u32 %rd1152, %r2633, 1792; | |
add.s64 %rd1153, %rd135, %rd1152; | |
mul.wide.u32 %rd1154, %r2634, 28; | |
add.s64 %rd1155, %rd1153, %rd1154; | |
ld.global.u32 %r2635, [%rd1155]; | |
and.b32 %r2636, %r2635, 65535; | |
shl.b32 %r2637, %r2636, 6; | |
bfe.u32 %r2638, %r2635, 16, 6; | |
or.b32 %r839, %r2637, %r2638; | |
st.local.u32 [%rd1+568], %r839; | |
bfe.u32 %r2639, %r2632, 22, 6; | |
mul.wide.u32 %rd1156, %r2639, 28; | |
add.s64 %rd1157, %rd1153, %rd1156; | |
ld.global.u32 %r2640, [%rd1157]; | |
and.b32 %r2641, %r2640, 65535; | |
shl.b32 %r2642, %r2641, 6; | |
bfe.u32 %r2643, %r2640, 16, 6; | |
or.b32 %r5534, %r2642, %r2643; | |
st.local.u32 [%rd1+572], %r5534; | |
setp.le.u32 %p141, %r839, %r5534; | |
mov.u32 %r5533, %r839; | |
@%p141 bra BB0_280; | |
st.local.u32 [%rd1+568], %r5534; | |
st.local.u32 [%rd1+572], %r839; | |
mov.u32 %r5262, %r5534; | |
mov.u32 %r5534, %r839; | |
mov.u32 %r5533, %r5262; | |
BB0_280: | |
mov.u32 %r842, %r5533; | |
mov.u32 %r841, %r5534; | |
setp.le.u32 %p142, %r5527, %r842; | |
mov.u32 %r5529, %r842; | |
mov.u32 %r5530, %r841; | |
@%p142 bra BB0_282; | |
st.local.u32 [%rd1+560], %r842; | |
st.local.u32 [%rd1+568], %r5527; | |
st.local.u32 [%rd1+564], %r841; | |
st.local.u32 [%rd1+572], %r5528; | |
mov.u32 %r5259, %r5528; | |
mov.u32 %r5261, %r5527; | |
mov.u32 %r5528, %r841; | |
mov.u32 %r5527, %r842; | |
mov.u32 %r5529, %r5261; | |
mov.u32 %r5530, %r5259; | |
BB0_282: | |
mov.u32 %r846, %r5527; | |
mov.u32 %r845, %r5528; | |
mov.u32 %r844, %r5529; | |
mov.u32 %r843, %r5530; | |
setp.le.u32 %p143, %r5511, %r846; | |
mov.u32 %r5515, %r846; | |
mov.u32 %r5516, %r845; | |
mov.u32 %r5517, %r844; | |
mov.u32 %r5518, %r843; | |
@%p143 bra BB0_284; | |
st.local.u32 [%rd1+544], %r846; | |
st.local.u32 [%rd1+560], %r5511; | |
st.local.u32 [%rd1+548], %r845; | |
st.local.u32 [%rd1+564], %r5512; | |
st.local.u32 [%rd1+552], %r844; | |
st.local.u32 [%rd1+568], %r5513; | |
st.local.u32 [%rd1+556], %r843; | |
st.local.u32 [%rd1+572], %r5514; | |
mov.u32 %r5249, %r5514; | |
mov.u32 %r5251, %r5513; | |
mov.u32 %r5253, %r5512; | |
mov.u32 %r5255, %r5511; | |
mov.u32 %r5514, %r843; | |
mov.u32 %r5513, %r844; | |
mov.u32 %r5512, %r845; | |
mov.u32 %r5511, %r846; | |
mov.u32 %r5515, %r5255; | |
mov.u32 %r5516, %r5253; | |
mov.u32 %r5517, %r5251; | |
mov.u32 %r5518, %r5249; | |
BB0_284: | |
mov.u32 %r854, %r5511; | |
mov.u32 %r853, %r5512; | |
mov.u32 %r852, %r5513; | |
mov.u32 %r851, %r5514; | |
mov.u32 %r850, %r5515; | |
mov.u32 %r849, %r5516; | |
mov.u32 %r848, %r5517; | |
mov.u32 %r847, %r5518; | |
setp.le.u32 %p144, %r5471, %r854; | |
mov.u32 %r5479, %r854; | |
mov.u32 %r5480, %r853; | |
mov.u32 %r5481, %r852; | |
mov.u32 %r5482, %r851; | |
mov.u32 %r5483, %r850; | |
mov.u32 %r5484, %r849; | |
mov.u32 %r5485, %r848; | |
mov.u32 %r5486, %r847; | |
@%p144 bra BB0_286; | |
st.local.u32 [%rd1+512], %r854; | |
st.local.u32 [%rd1+544], %r5471; | |
st.local.u32 [%rd1+516], %r853; | |
st.local.u32 [%rd1+548], %r5472; | |
st.local.u32 [%rd1+520], %r852; | |
st.local.u32 [%rd1+552], %r5473; | |
st.local.u32 [%rd1+524], %r851; | |
st.local.u32 [%rd1+556], %r5474; | |
st.local.u32 [%rd1+528], %r850; | |
st.local.u32 [%rd1+560], %r5475; | |
st.local.u32 [%rd1+532], %r849; | |
st.local.u32 [%rd1+564], %r5476; | |
st.local.u32 [%rd1+536], %r848; | |
st.local.u32 [%rd1+568], %r5477; | |
st.local.u32 [%rd1+540], %r847; | |
st.local.u32 [%rd1+572], %r5478; | |
mov.u32 %r5221, %r5478; | |
mov.u32 %r5223, %r5477; | |
mov.u32 %r5225, %r5476; | |
mov.u32 %r5227, %r5475; | |
mov.u32 %r5229, %r5474; | |
mov.u32 %r5231, %r5473; | |
mov.u32 %r5233, %r5472; | |
mov.u32 %r5235, %r5471; | |
mov.u32 %r5478, %r847; | |
mov.u32 %r5477, %r848; | |
mov.u32 %r5476, %r849; | |
mov.u32 %r5475, %r850; | |
mov.u32 %r5474, %r851; | |
mov.u32 %r5473, %r852; | |
mov.u32 %r5472, %r853; | |
mov.u32 %r5471, %r854; | |
mov.u32 %r5479, %r5235; | |
mov.u32 %r5480, %r5233; | |
mov.u32 %r5481, %r5231; | |
mov.u32 %r5482, %r5229; | |
mov.u32 %r5483, %r5227; | |
mov.u32 %r5484, %r5225; | |
mov.u32 %r5485, %r5223; | |
mov.u32 %r5486, %r5221; | |
BB0_286: | |
mov.u32 %r870, %r5471; | |
mul.lo.s64 %rd1158, %rd65, 1792; | |
add.s64 %rd1159, %rd3, %rd1158; | |
bfe.u32 %r2644, %r783, 22, 6; | |
mul.wide.u32 %rd1160, %r2644, 28; | |
add.s64 %rd1161, %rd1159, %rd1160; | |
ld.global.u32 %r871, [%rd1161+-4]; | |
and.b32 %r2645, %r871, 65535; | |
mul.wide.u32 %rd1162, %r2645, 1792; | |
add.s64 %rd1163, %rd136, %rd1162; | |
bfe.u32 %r2646, %r871, 16, 6; | |
mul.wide.u32 %rd1164, %r2646, 28; | |
add.s64 %rd1165, %rd1163, %rd1164; | |
ld.global.u32 %r872, [%rd1165+4]; | |
and.b32 %r2647, %r872, 65535; | |
mul.wide.u32 %rd1166, %r2647, 1792; | |
add.s64 %rd1167, %rd3, %rd1166; | |
cvt.u64.u32 %rd73, %r2645; | |
cvt.u64.u32 %rd74, %r2647; | |
bfe.u32 %r2648, %r872, 16, 6; | |
mul.wide.u32 %rd1168, %r2648, 28; | |
add.s64 %rd1169, %rd1167, %rd1168; | |
ld.global.u32 %r873, [%rd1169+-8]; | |
and.b32 %r2649, %r873, 65535; | |
cvt.u64.u32 %rd75, %r2649; | |
bfe.u32 %r2650, %r873, 16, 6; | |
mul.wide.u32 %rd1170, %r2649, 1792; | |
add.s64 %rd1171, %rd136, %rd1170; | |
mul.wide.u32 %rd1172, %r2650, 28; | |
add.s64 %rd1173, %rd1171, %rd1172; | |
ld.global.u32 %r2651, [%rd1173]; | |
and.b32 %r2652, %r2651, 65535; | |
bfe.u32 %r2653, %r2651, 16, 6; | |
mul.wide.u32 %rd1174, %r2652, 1792; | |
add.s64 %rd1175, %rd135, %rd1174; | |
mul.wide.u32 %rd1176, %r2653, 28; | |
add.s64 %rd1177, %rd1175, %rd1176; | |
ld.global.u32 %r2654, [%rd1177]; | |
and.b32 %r2655, %r2654, 65535; | |
shl.b32 %r2656, %r2655, 6; | |
bfe.u32 %r2657, %r2654, 16, 6; | |
or.b32 %r874, %r2656, %r2657; | |
st.local.u32 [%rd1+576], %r874; | |
bfe.u32 %r2658, %r2651, 22, 6; | |
mul.wide.u32 %rd1178, %r2658, 28; | |
add.s64 %rd1179, %rd1175, %rd1178; | |
ld.global.u32 %r2659, [%rd1179]; | |
and.b32 %r2660, %r2659, 65535; | |
shl.b32 %r2661, %r2660, 6; | |
bfe.u32 %r2662, %r2659, 16, 6; | |
or.b32 %r5436, %r2661, %r2662; | |
st.local.u32 [%rd1+580], %r5436; | |
setp.le.u32 %p145, %r874, %r5436; | |
mov.u32 %r5435, %r874; | |
@%p145 bra BB0_288; | |
st.local.u32 [%rd1+576], %r5436; | |
st.local.u32 [%rd1+580], %r874; | |
mov.u32 %r5293, %r5436; | |
mov.u32 %r5436, %r874; | |
mov.u32 %r5435, %r5293; | |
BB0_288: | |
mov.u32 %r5431, %r5435; | |
mov.u32 %r5432, %r5436; | |
bfe.u32 %r2663, %r873, 22, 6; | |
mul.lo.s64 %rd1180, %rd75, 1792; | |
add.s64 %rd1181, %rd136, %rd1180; | |
mul.wide.u32 %rd1182, %r2663, 28; | |
add.s64 %rd1183, %rd1181, %rd1182; | |
ld.global.u32 %r2664, [%rd1183]; | |
and.b32 %r2665, %r2664, 65535; | |
bfe.u32 %r2666, %r2664, 16, 6; | |
mul.wide.u32 %rd1184, %r2665, 1792; | |
add.s64 %rd1185, %rd135, %rd1184; | |
mul.wide.u32 %rd1186, %r2666, 28; | |
add.s64 %rd1187, %rd1185, %rd1186; | |
ld.global.u32 %r2667, [%rd1187]; | |
and.b32 %r2668, %r2667, 65535; | |
shl.b32 %r2669, %r2668, 6; | |
bfe.u32 %r2670, %r2667, 16, 6; | |
or.b32 %r878, %r2669, %r2670; | |
st.local.u32 [%rd1+584], %r878; | |
bfe.u32 %r2671, %r2664, 22, 6; | |
mul.wide.u32 %rd1188, %r2671, 28; | |
add.s64 %rd1189, %rd1185, %rd1188; | |
ld.global.u32 %r2672, [%rd1189]; | |
and.b32 %r2673, %r2672, 65535; | |
shl.b32 %r2674, %r2673, 6; | |
bfe.u32 %r2675, %r2672, 16, 6; | |
or.b32 %r5438, %r2674, %r2675; | |
st.local.u32 [%rd1+588], %r5438; | |
setp.le.u32 %p146, %r878, %r5438; | |
mov.u32 %r5437, %r878; | |
@%p146 bra BB0_290; | |
st.local.u32 [%rd1+584], %r5438; | |
st.local.u32 [%rd1+588], %r878; | |
mov.u32 %r5299, %r5438; | |
mov.u32 %r5438, %r878; | |
mov.u32 %r5437, %r5299; | |
BB0_290: | |
mov.u32 %r881, %r5437; | |
mov.u32 %r880, %r5438; | |
setp.le.u32 %p147, %r5431, %r881; | |
mov.u32 %r5433, %r881; | |
mov.u32 %r5434, %r880; | |
@%p147 bra BB0_292; | |
st.local.u32 [%rd1+576], %r881; | |
st.local.u32 [%rd1+584], %r5431; | |
st.local.u32 [%rd1+580], %r880; | |
st.local.u32 [%rd1+588], %r5432; | |
mov.u32 %r5296, %r5432; | |
mov.u32 %r5298, %r5431; | |
mov.u32 %r5432, %r880; | |
mov.u32 %r5431, %r881; | |
mov.u32 %r5433, %r5298; | |
mov.u32 %r5434, %r5296; | |
BB0_292: | |
mov.u32 %r5423, %r5431; | |
mov.u32 %r5424, %r5432; | |
mov.u32 %r5425, %r5433; | |
mov.u32 %r5426, %r5434; | |
mul.lo.s64 %rd1190, %rd74, 1792; | |
add.s64 %rd1191, %rd3, %rd1190; | |
bfe.u32 %r2676, %r872, 22, 6; | |
mul.wide.u32 %rd1192, %r2676, 28; | |
add.s64 %rd1193, %rd1191, %rd1192; | |
ld.global.u32 %r886, [%rd1193+-8]; | |
and.b32 %r2677, %r886, 65535; | |
cvt.u64.u32 %rd76, %r2677; | |
bfe.u32 %r2678, %r886, 16, 6; | |
mul.wide.u32 %rd1194, %r2677, 1792; | |
add.s64 %rd1195, %rd136, %rd1194; | |
mul.wide.u32 %rd1196, %r2678, 28; | |
add.s64 %rd1197, %rd1195, %rd1196; | |
ld.global.u32 %r2679, [%rd1197]; | |
and.b32 %r2680, %r2679, 65535; | |
bfe.u32 %r2681, %r2679, 16, 6; | |
mul.wide.u32 %rd1198, %r2680, 1792; | |
add.s64 %rd1199, %rd135, %rd1198; | |
mul.wide.u32 %rd1200, %r2681, 28; | |
add.s64 %rd1201, %rd1199, %rd1200; | |
ld.global.u32 %r2682, [%rd1201]; | |
and.b32 %r2683, %r2682, 65535; | |
shl.b32 %r2684, %r2683, 6; | |
bfe.u32 %r2685, %r2682, 16, 6; | |
or.b32 %r887, %r2684, %r2685; | |
st.local.u32 [%rd1+592], %r887; | |
bfe.u32 %r2686, %r2679, 22, 6; | |
mul.wide.u32 %rd1202, %r2686, 28; | |
add.s64 %rd1203, %rd1199, %rd1202; | |
ld.global.u32 %r2687, [%rd1203]; | |
and.b32 %r2688, %r2687, 65535; | |
shl.b32 %r2689, %r2688, 6; | |
bfe.u32 %r2690, %r2687, 16, 6; | |
or.b32 %r5444, %r2689, %r2690; | |
st.local.u32 [%rd1+596], %r5444; | |
setp.le.u32 %p148, %r887, %r5444; | |
mov.u32 %r5443, %r887; | |
@%p148 bra BB0_294; | |
st.local.u32 [%rd1+592], %r5444; | |
st.local.u32 [%rd1+596], %r887; | |
mov.u32 %r5313, %r5444; | |
mov.u32 %r5444, %r887; | |
mov.u32 %r5443, %r5313; | |
BB0_294: | |
mov.u32 %r5439, %r5443; | |
mov.u32 %r5440, %r5444; | |
bfe.u32 %r2691, %r886, 22, 6; | |
mul.lo.s64 %rd1204, %rd76, 1792; | |
add.s64 %rd1205, %rd136, %rd1204; | |
mul.wide.u32 %rd1206, %r2691, 28; | |
add.s64 %rd1207, %rd1205, %rd1206; | |
ld.global.u32 %r2692, [%rd1207]; | |
and.b32 %r2693, %r2692, 65535; | |
bfe.u32 %r2694, %r2692, 16, 6; | |
mul.wide.u32 %rd1208, %r2693, 1792; | |
add.s64 %rd1209, %rd135, %rd1208; | |
mul.wide.u32 %rd1210, %r2694, 28; | |
add.s64 %rd1211, %rd1209, %rd1210; | |
ld.global.u32 %r2695, [%rd1211]; | |
and.b32 %r2696, %r2695, 65535; | |
shl.b32 %r2697, %r2696, 6; | |
bfe.u32 %r2698, %r2695, 16, 6; | |
or.b32 %r891, %r2697, %r2698; | |
st.local.u32 [%rd1+600], %r891; | |
bfe.u32 %r2699, %r2692, 22, 6; | |
mul.wide.u32 %rd1212, %r2699, 28; | |
add.s64 %rd1213, %rd1209, %rd1212; | |
ld.global.u32 %r2700, [%rd1213]; | |
and.b32 %r2701, %r2700, 65535; | |
shl.b32 %r2702, %r2701, 6; | |
bfe.u32 %r2703, %r2700, 16, 6; | |
or.b32 %r5446, %r2702, %r2703; | |
st.local.u32 [%rd1+604], %r5446; | |
setp.le.u32 %p149, %r891, %r5446; | |
mov.u32 %r5445, %r891; | |
@%p149 bra BB0_296; | |
st.local.u32 [%rd1+600], %r5446; | |
st.local.u32 [%rd1+604], %r891; | |
mov.u32 %r5319, %r5446; | |
mov.u32 %r5446, %r891; | |
mov.u32 %r5445, %r5319; | |
BB0_296: | |
mov.u32 %r894, %r5445; | |
mov.u32 %r893, %r5446; | |
setp.le.u32 %p150, %r5439, %r894; | |
mov.u32 %r5441, %r894; | |
mov.u32 %r5442, %r893; | |
@%p150 bra BB0_298; | |
st.local.u32 [%rd1+592], %r894; | |
st.local.u32 [%rd1+600], %r5439; | |
st.local.u32 [%rd1+596], %r893; | |
st.local.u32 [%rd1+604], %r5440; | |
mov.u32 %r5316, %r5440; | |
mov.u32 %r5318, %r5439; | |
mov.u32 %r5440, %r893; | |
mov.u32 %r5439, %r894; | |
mov.u32 %r5441, %r5318; | |
mov.u32 %r5442, %r5316; | |
BB0_298: | |
mov.u32 %r898, %r5439; | |
mov.u32 %r897, %r5440; | |
mov.u32 %r896, %r5441; | |
mov.u32 %r895, %r5442; | |
setp.le.u32 %p151, %r5423, %r898; | |
mov.u32 %r5427, %r898; | |
mov.u32 %r5428, %r897; | |
mov.u32 %r5429, %r896; | |
mov.u32 %r5430, %r895; | |
@%p151 bra BB0_300; | |
st.local.u32 [%rd1+576], %r898; | |
st.local.u32 [%rd1+592], %r5423; | |
st.local.u32 [%rd1+580], %r897; | |
st.local.u32 [%rd1+596], %r5424; | |
st.local.u32 [%rd1+584], %r896; | |
st.local.u32 [%rd1+600], %r5425; | |
st.local.u32 [%rd1+588], %r895; | |
st.local.u32 [%rd1+604], %r5426; | |
mov.u32 %r5306, %r5426; | |
mov.u32 %r5308, %r5425; | |
mov.u32 %r5310, %r5424; | |
mov.u32 %r5312, %r5423; | |
mov.u32 %r5426, %r895; | |
mov.u32 %r5425, %r896; | |
mov.u32 %r5424, %r897; | |
mov.u32 %r5423, %r898; | |
mov.u32 %r5427, %r5312; | |
mov.u32 %r5428, %r5310; | |
mov.u32 %r5429, %r5308; | |
mov.u32 %r5430, %r5306; | |
BB0_300: | |
mov.u32 %r5407, %r5423; | |
mov.u32 %r5408, %r5424; | |
mov.u32 %r5409, %r5425; | |
mov.u32 %r5410, %r5426; | |
mov.u32 %r5411, %r5427; | |
mov.u32 %r5412, %r5428; | |
mov.u32 %r5413, %r5429; | |
mov.u32 %r5414, %r5430; | |
mul.lo.s64 %rd1214, %rd73, 1792; | |
add.s64 %rd1215, %rd136, %rd1214; | |
bfe.u32 %r2704, %r871, 22, 6; | |
mul.wide.u32 %rd1216, %r2704, 28; | |
add.s64 %rd1217, %rd1215, %rd1216; | |
ld.global.u32 %r907, [%rd1217+4]; | |
and.b32 %r2705, %r907, 65535; | |
mul.wide.u32 %rd1218, %r2705, 1792; | |
add.s64 %rd1219, %rd3, %rd1218; | |
cvt.u64.u32 %rd77, %r2705; | |
bfe.u32 %r2706, %r907, 16, 6; | |
mul.wide.u32 %rd1220, %r2706, 28; | |
add.s64 %rd1221, %rd1219, %rd1220; | |
ld.global.u32 %r908, [%rd1221+-8]; | |
and.b32 %r2707, %r908, 65535; | |
cvt.u64.u32 %rd78, %r2707; | |
bfe.u32 %r2708, %r908, 16, 6; | |
mul.wide.u32 %rd1222, %r2707, 1792; | |
add.s64 %rd1223, %rd136, %rd1222; | |
mul.wide.u32 %rd1224, %r2708, 28; | |
add.s64 %rd1225, %rd1223, %rd1224; | |
ld.global.u32 %r2709, [%rd1225]; | |
and.b32 %r2710, %r2709, 65535; | |
bfe.u32 %r2711, %r2709, 16, 6; | |
mul.wide.u32 %rd1226, %r2710, 1792; | |
add.s64 %rd1227, %rd135, %rd1226; | |
mul.wide.u32 %rd1228, %r2711, 28; | |
add.s64 %rd1229, %rd1227, %rd1228; | |
ld.global.u32 %r2712, [%rd1229]; | |
and.b32 %r2713, %r2712, 65535; | |
shl.b32 %r2714, %r2713, 6; | |
bfe.u32 %r2715, %r2712, 16, 6; | |
or.b32 %r909, %r2714, %r2715; | |
st.local.u32 [%rd1+608], %r909; | |
bfe.u32 %r2716, %r2709, 22, 6; | |
mul.wide.u32 %rd1230, %r2716, 28; | |
add.s64 %rd1231, %rd1227, %rd1230; | |
ld.global.u32 %r2717, [%rd1231]; | |
and.b32 %r2718, %r2717, 65535; | |
shl.b32 %r2719, %r2718, 6; | |
bfe.u32 %r2720, %r2717, 16, 6; | |
or.b32 %r5460, %r2719, %r2720; | |
st.local.u32 [%rd1+612], %r5460; | |
setp.le.u32 %p152, %r909, %r5460; | |
mov.u32 %r5459, %r909; | |
@%p152 bra BB0_302; | |
st.local.u32 [%rd1+608], %r5460; | |
st.local.u32 [%rd1+612], %r909; | |
mov.u32 %r5349, %r5460; | |
mov.u32 %r5460, %r909; | |
mov.u32 %r5459, %r5349; | |
BB0_302: | |
mov.u32 %r5455, %r5459; | |
mov.u32 %r5456, %r5460; | |
bfe.u32 %r2721, %r908, 22, 6; | |
mul.lo.s64 %rd1232, %rd78, 1792; | |
add.s64 %rd1233, %rd136, %rd1232; | |
mul.wide.u32 %rd1234, %r2721, 28; | |
add.s64 %rd1235, %rd1233, %rd1234; | |
ld.global.u32 %r2722, [%rd1235]; | |
and.b32 %r2723, %r2722, 65535; | |
bfe.u32 %r2724, %r2722, 16, 6; | |
mul.wide.u32 %rd1236, %r2723, 1792; | |
add.s64 %rd1237, %rd135, %rd1236; | |
mul.wide.u32 %rd1238, %r2724, 28; | |
add.s64 %rd1239, %rd1237, %rd1238; | |
ld.global.u32 %r2725, [%rd1239]; | |
and.b32 %r2726, %r2725, 65535; | |
shl.b32 %r2727, %r2726, 6; | |
bfe.u32 %r2728, %r2725, 16, 6; | |
or.b32 %r913, %r2727, %r2728; | |
st.local.u32 [%rd1+616], %r913; | |
bfe.u32 %r2729, %r2722, 22, 6; | |
mul.wide.u32 %rd1240, %r2729, 28; | |
add.s64 %rd1241, %rd1237, %rd1240; | |
ld.global.u32 %r2730, [%rd1241]; | |
and.b32 %r2731, %r2730, 65535; | |
shl.b32 %r2732, %r2731, 6; | |
bfe.u32 %r2733, %r2730, 16, 6; | |
or.b32 %r5462, %r2732, %r2733; | |
st.local.u32 [%rd1+620], %r5462; | |
setp.le.u32 %p153, %r913, %r5462; | |
mov.u32 %r5461, %r913; | |
@%p153 bra BB0_304; | |
st.local.u32 [%rd1+616], %r5462; | |
st.local.u32 [%rd1+620], %r913; | |
mov.u32 %r5355, %r5462; | |
mov.u32 %r5462, %r913; | |
mov.u32 %r5461, %r5355; | |
BB0_304: | |
mov.u32 %r916, %r5461; | |
mov.u32 %r915, %r5462; | |
setp.le.u32 %p154, %r5455, %r916; | |
mov.u32 %r5457, %r916; | |
mov.u32 %r5458, %r915; | |
@%p154 bra BB0_306; | |
st.local.u32 [%rd1+608], %r916; | |
st.local.u32 [%rd1+616], %r5455; | |
st.local.u32 [%rd1+612], %r915; | |
st.local.u32 [%rd1+620], %r5456; | |
mov.u32 %r5352, %r5456; | |
mov.u32 %r5354, %r5455; | |
mov.u32 %r5456, %r915; | |
mov.u32 %r5455, %r916; | |
mov.u32 %r5457, %r5354; | |
mov.u32 %r5458, %r5352; | |
BB0_306: | |
mov.u32 %r5447, %r5455; | |
mov.u32 %r5448, %r5456; | |
mov.u32 %r5449, %r5457; | |
mov.u32 %r5450, %r5458; | |
mul.lo.s64 %rd1242, %rd77, 1792; | |
add.s64 %rd1243, %rd3, %rd1242; | |
bfe.u32 %r2734, %r907, 22, 6; | |
mul.wide.u32 %rd1244, %r2734, 28; | |
add.s64 %rd1245, %rd1243, %rd1244; | |
ld.global.u32 %r921, [%rd1245+-8]; | |
and.b32 %r2735, %r921, 65535; | |
cvt.u64.u32 %rd79, %r2735; | |
bfe.u32 %r2736, %r921, 16, 6; | |
mul.wide.u32 %rd1246, %r2735, 1792; | |
add.s64 %rd1247, %rd136, %rd1246; | |
mul.wide.u32 %rd1248, %r2736, 28; | |
add.s64 %rd1249, %rd1247, %rd1248; | |
ld.global.u32 %r2737, [%rd1249]; | |
and.b32 %r2738, %r2737, 65535; | |
bfe.u32 %r2739, %r2737, 16, 6; | |
mul.wide.u32 %rd1250, %r2738, 1792; | |
add.s64 %rd1251, %rd135, %rd1250; | |
mul.wide.u32 %rd1252, %r2739, 28; | |
add.s64 %rd1253, %rd1251, %rd1252; | |
ld.global.u32 %r2740, [%rd1253]; | |
and.b32 %r2741, %r2740, 65535; | |
shl.b32 %r2742, %r2741, 6; | |
bfe.u32 %r2743, %r2740, 16, 6; | |
or.b32 %r922, %r2742, %r2743; | |
st.local.u32 [%rd1+624], %r922; | |
bfe.u32 %r2744, %r2737, 22, 6; | |
mul.wide.u32 %rd1254, %r2744, 28; | |
add.s64 %rd1255, %rd1251, %rd1254; | |
ld.global.u32 %r2745, [%rd1255]; | |
and.b32 %r2746, %r2745, 65535; | |
shl.b32 %r2747, %r2746, 6; | |
bfe.u32 %r2748, %r2745, 16, 6; | |
or.b32 %r5468, %r2747, %r2748; | |
st.local.u32 [%rd1+628], %r5468; | |
setp.le.u32 %p155, %r922, %r5468; | |
mov.u32 %r5467, %r922; | |
@%p155 bra BB0_308; | |
st.local.u32 [%rd1+624], %r5468; | |
st.local.u32 [%rd1+628], %r922; | |
mov.u32 %r5369, %r5468; | |
mov.u32 %r5468, %r922; | |
mov.u32 %r5467, %r5369; | |
BB0_308: | |
mov.u32 %r5463, %r5467; | |
mov.u32 %r5464, %r5468; | |
bfe.u32 %r2749, %r921, 22, 6; | |
mul.lo.s64 %rd1256, %rd79, 1792; | |
add.s64 %rd1257, %rd136, %rd1256; | |
mul.wide.u32 %rd1258, %r2749, 28; | |
add.s64 %rd1259, %rd1257, %rd1258; | |
ld.global.u32 %r2750, [%rd1259]; | |
and.b32 %r2751, %r2750, 65535; | |
bfe.u32 %r2752, %r2750, 16, 6; | |
mul.wide.u32 %rd1260, %r2751, 1792; | |
add.s64 %rd1261, %rd135, %rd1260; | |
mul.wide.u32 %rd1262, %r2752, 28; | |
add.s64 %rd1263, %rd1261, %rd1262; | |
ld.global.u32 %r2753, [%rd1263]; | |
and.b32 %r2754, %r2753, 65535; | |
shl.b32 %r2755, %r2754, 6; | |
bfe.u32 %r2756, %r2753, 16, 6; | |
or.b32 %r926, %r2755, %r2756; | |
st.local.u32 [%rd1+632], %r926; | |
bfe.u32 %r2757, %r2750, 22, 6; | |
mul.wide.u32 %rd1264, %r2757, 28; | |
add.s64 %rd1265, %rd1261, %rd1264; | |
ld.global.u32 %r2758, [%rd1265]; | |
and.b32 %r2759, %r2758, 65535; | |
shl.b32 %r2760, %r2759, 6; | |
bfe.u32 %r2761, %r2758, 16, 6; | |
or.b32 %r5470, %r2760, %r2761; | |
st.local.u32 [%rd1+636], %r5470; | |
setp.le.u32 %p156, %r926, %r5470; | |
mov.u32 %r5469, %r926; | |
@%p156 bra BB0_310; | |
st.local.u32 [%rd1+632], %r5470; | |
st.local.u32 [%rd1+636], %r926; | |
mov.u32 %r5375, %r5470; | |
mov.u32 %r5470, %r926; | |
mov.u32 %r5469, %r5375; | |
BB0_310: | |
mov.u32 %r929, %r5469; | |
mov.u32 %r928, %r5470; | |
setp.le.u32 %p157, %r5463, %r929; | |
mov.u32 %r5465, %r929; | |
mov.u32 %r5466, %r928; | |
@%p157 bra BB0_312; | |
st.local.u32 [%rd1+624], %r929; | |
st.local.u32 [%rd1+632], %r5463; | |
st.local.u32 [%rd1+628], %r928; | |
st.local.u32 [%rd1+636], %r5464; | |
mov.u32 %r5372, %r5464; | |
mov.u32 %r5374, %r5463; | |
mov.u32 %r5464, %r928; | |
mov.u32 %r5463, %r929; | |
mov.u32 %r5465, %r5374; | |
mov.u32 %r5466, %r5372; | |
BB0_312: | |
mov.u32 %r933, %r5463; | |
mov.u32 %r932, %r5464; | |
mov.u32 %r931, %r5465; | |
mov.u32 %r930, %r5466; | |
setp.le.u32 %p158, %r5447, %r933; | |
mov.u32 %r5451, %r933; | |
mov.u32 %r5452, %r932; | |
mov.u32 %r5453, %r931; | |
mov.u32 %r5454, %r930; | |
@%p158 bra BB0_314; | |
st.local.u32 [%rd1+608], %r933; | |
st.local.u32 [%rd1+624], %r5447; | |
st.local.u32 [%rd1+612], %r932; | |
st.local.u32 [%rd1+628], %r5448; | |
st.local.u32 [%rd1+616], %r931; | |
st.local.u32 [%rd1+632], %r5449; | |
st.local.u32 [%rd1+620], %r930; | |
st.local.u32 [%rd1+636], %r5450; | |
mov.u32 %r5362, %r5450; | |
mov.u32 %r5364, %r5449; | |
mov.u32 %r5366, %r5448; | |
mov.u32 %r5368, %r5447; | |
mov.u32 %r5450, %r930; | |
mov.u32 %r5449, %r931; | |
mov.u32 %r5448, %r932; | |
mov.u32 %r5447, %r933; | |
mov.u32 %r5451, %r5368; | |
mov.u32 %r5452, %r5366; | |
mov.u32 %r5453, %r5364; | |
mov.u32 %r5454, %r5362; | |
BB0_314: | |
mov.u32 %r941, %r5447; | |
mov.u32 %r940, %r5448; | |
mov.u32 %r939, %r5449; | |
mov.u32 %r938, %r5450; | |
mov.u32 %r937, %r5451; | |
mov.u32 %r936, %r5452; | |
mov.u32 %r935, %r5453; | |
mov.u32 %r934, %r5454; | |
setp.le.u32 %p159, %r5407, %r941; | |
mov.u32 %r5415, %r941; | |
mov.u32 %r5416, %r940; | |
mov.u32 %r5417, %r939; | |
mov.u32 %r5418, %r938; | |
mov.u32 %r5419, %r937; | |
mov.u32 %r5420, %r936; | |
mov.u32 %r5421, %r935; | |
mov.u32 %r5422, %r934; | |
@%p159 bra BB0_316; | |
st.local.u32 [%rd1+576], %r941; | |
st.local.u32 [%rd1+608], %r5407; | |
st.local.u32 [%rd1+580], %r940; | |
st.local.u32 [%rd1+612], %r5408; | |
st.local.u32 [%rd1+584], %r939; | |
st.local.u32 [%rd1+616], %r5409; | |
st.local.u32 [%rd1+588], %r938; | |
st.local.u32 [%rd1+620], %r5410; | |
st.local.u32 [%rd1+592], %r937; | |
st.local.u32 [%rd1+624], %r5411; | |
st.local.u32 [%rd1+596], %r936; | |
st.local.u32 [%rd1+628], %r5412; | |
st.local.u32 [%rd1+600], %r935; | |
st.local.u32 [%rd1+632], %r5413; | |
st.local.u32 [%rd1+604], %r934; | |
st.local.u32 [%rd1+636], %r5414; | |
mov.u32 %r5334, %r5414; | |
mov.u32 %r5336, %r5413; | |
mov.u32 %r5338, %r5412; | |
mov.u32 %r5340, %r5411; | |
mov.u32 %r5342, %r5410; | |
mov.u32 %r5344, %r5409; | |
mov.u32 %r5346, %r5408; | |
mov.u32 %r5348, %r5407; | |
mov.u32 %r5414, %r934; | |
mov.u32 %r5413, %r935; | |
mov.u32 %r5412, %r936; | |
mov.u32 %r5411, %r937; | |
mov.u32 %r5410, %r938; | |
mov.u32 %r5409, %r939; | |
mov.u32 %r5408, %r940; | |
mov.u32 %r5407, %r941; | |
mov.u32 %r5415, %r5348; | |
mov.u32 %r5416, %r5346; | |
mov.u32 %r5417, %r5344; | |
mov.u32 %r5418, %r5342; | |
mov.u32 %r5419, %r5340; | |
mov.u32 %r5420, %r5338; | |
mov.u32 %r5421, %r5336; | |
mov.u32 %r5422, %r5334; | |
BB0_316: | |
mov.u32 %r957, %r5407; | |
setp.le.u32 %p160, %r870, %r957; | |
mov.u32 %r5406, %r870; | |
@%p160 bra BB0_318; | |
st.local.u32 [%rd1+512], %r957; | |
st.local.u32 [%rd1+576], %r870; | |
st.local.u32 [%rd1+516], %r5408; | |
st.local.u32 [%rd1+580], %r5472; | |
st.local.u32 [%rd1+520], %r5409; | |
st.local.u32 [%rd1+584], %r5473; | |
st.local.u32 [%rd1+524], %r5410; | |
st.local.u32 [%rd1+588], %r5474; | |
st.local.u32 [%rd1+528], %r5411; | |
st.local.u32 [%rd1+592], %r5475; | |
st.local.u32 [%rd1+532], %r5412; | |
st.local.u32 [%rd1+596], %r5476; | |
st.local.u32 [%rd1+536], %r5413; | |
st.local.u32 [%rd1+600], %r5477; | |
st.local.u32 [%rd1+540], %r5414; | |
st.local.u32 [%rd1+604], %r5478; | |
st.local.u32 [%rd1+544], %r5415; | |
st.local.u32 [%rd1+608], %r5479; | |
st.local.u32 [%rd1+548], %r5416; | |
st.local.u32 [%rd1+612], %r5480; | |
st.local.u32 [%rd1+552], %r5417; | |
st.local.u32 [%rd1+616], %r5481; | |
st.local.u32 [%rd1+556], %r5418; | |
st.local.u32 [%rd1+620], %r5482; | |
st.local.u32 [%rd1+560], %r5419; | |
st.local.u32 [%rd1+624], %r5483; | |
st.local.u32 [%rd1+564], %r5420; | |
st.local.u32 [%rd1+628], %r5484; | |
st.local.u32 [%rd1+568], %r5421; | |
st.local.u32 [%rd1+632], %r5485; | |
st.local.u32 [%rd1+572], %r5422; | |
st.local.u32 [%rd1+636], %r5486; | |
mov.u32 %r5406, %r957; | |
BB0_318: | |
mul.lo.s64 %rd1267, %rd64, 1792; | |
add.s64 %rd1268, %rd146, %rd1267; | |
bfe.u32 %r2762, %r782, 22, 6; | |
mul.wide.u32 %rd1269, %r2762, 28; | |
add.s64 %rd1270, %rd1268, %rd1269; | |
ld.global.u32 %r959, [%rd1270+4]; | |
and.b32 %r2763, %r959, 65535; | |
mul.wide.u32 %rd1271, %r2763, 1792; | |
add.s64 %rd1272, %rd3, %rd1271; | |
bfe.u32 %r2764, %r959, 16, 6; | |
mul.wide.u32 %rd1273, %r2764, 28; | |
add.s64 %rd1274, %rd1272, %rd1273; | |
ld.global.u32 %r960, [%rd1274+-4]; | |
and.b32 %r2765, %r960, 65535; | |
bfe.u32 %r2766, %r960, 16, 6; | |
mul.wide.u32 %rd1275, %r2765, 1792; | |
add.s64 %rd1276, %rd146, %rd1275; | |
mul.wide.u32 %rd1277, %r2766, 28; | |
add.s64 %rd1278, %rd1276, %rd1277; | |
ld.global.u32 %r961, [%rd1278]; | |
and.b32 %r2767, %r961, 65535; | |
mul.wide.u32 %rd1279, %r2767, 1792; | |
add.s64 %rd1280, %rd3, %rd1279; | |
cvt.u64.u32 %rd80, %r2763; | |
cvt.u64.u32 %rd81, %r2765; | |
cvt.u64.u32 %rd82, %r2767; | |
bfe.u32 %r2768, %r961, 16, 6; | |
mul.wide.u32 %rd1281, %r2768, 28; | |
add.s64 %rd1282, %rd1280, %rd1281; | |
ld.global.u32 %r962, [%rd1282+-8]; | |
and.b32 %r2769, %r962, 65535; | |
cvt.u64.u32 %rd83, %r2769; | |
bfe.u32 %r2770, %r962, 16, 6; | |
mul.wide.u32 %rd1283, %r2769, 1792; | |
add.s64 %rd1284, %rd136, %rd1283; | |
mul.wide.u32 %rd1285, %r2770, 28; | |
add.s64 %rd1286, %rd1284, %rd1285; | |
ld.global.u32 %r2771, [%rd1286]; | |
and.b32 %r2772, %r2771, 65535; | |
bfe.u32 %r2773, %r2771, 16, 6; | |
mul.wide.u32 %rd1287, %r2772, 1792; | |
add.s64 %rd1288, %rd135, %rd1287; | |
mul.wide.u32 %rd1289, %r2773, 28; | |
add.s64 %rd1290, %rd1288, %rd1289; | |
ld.global.u32 %r2774, [%rd1290]; | |
and.b32 %r2775, %r2774, 65535; | |
shl.b32 %r2776, %r2775, 6; | |
bfe.u32 %r2777, %r2774, 16, 6; | |
or.b32 %r963, %r2776, %r2777; | |
st.local.u32 [%rd1+640], %r963; | |
bfe.u32 %r2778, %r2771, 22, 6; | |
mul.wide.u32 %rd1291, %r2778, 28; | |
add.s64 %rd1292, %rd1288, %rd1291; | |
ld.global.u32 %r2779, [%rd1292]; | |
and.b32 %r2780, %r2779, 65535; | |
shl.b32 %r2781, %r2780, 6; | |
bfe.u32 %r2782, %r2779, 16, 6; | |
or.b32 %r5855, %r2781, %r2782; | |
st.local.u32 [%rd1+644], %r5855; | |
setp.le.u32 %p161, %r963, %r5855; | |
mov.u32 %r5854, %r963; | |
@%p161 bra BB0_320; | |
st.local.u32 [%rd1+640], %r5855; | |
st.local.u32 [%rd1+644], %r963; | |
mov.u32 %r5535, %r5855; | |
mov.u32 %r5855, %r963; | |
mov.u32 %r5854, %r5535; | |
BB0_320: | |
mov.u32 %r5850, %r5854; | |
mov.u32 %r5851, %r5855; | |
bfe.u32 %r2783, %r962, 22, 6; | |
mul.lo.s64 %rd1293, %rd83, 1792; | |
add.s64 %rd1294, %rd136, %rd1293; | |
mul.wide.u32 %rd1295, %r2783, 28; | |
add.s64 %rd1296, %rd1294, %rd1295; | |
ld.global.u32 %r2784, [%rd1296]; | |
and.b32 %r2785, %r2784, 65535; | |
bfe.u32 %r2786, %r2784, 16, 6; | |
mul.wide.u32 %rd1297, %r2785, 1792; | |
add.s64 %rd1298, %rd135, %rd1297; | |
mul.wide.u32 %rd1299, %r2786, 28; | |
add.s64 %rd1300, %rd1298, %rd1299; | |
ld.global.u32 %r2787, [%rd1300]; | |
and.b32 %r2788, %r2787, 65535; | |
shl.b32 %r2789, %r2788, 6; | |
bfe.u32 %r2790, %r2787, 16, 6; | |
or.b32 %r967, %r2789, %r2790; | |
st.local.u32 [%rd1+648], %r967; | |
bfe.u32 %r2791, %r2784, 22, 6; | |
mul.wide.u32 %rd1301, %r2791, 28; | |
add.s64 %rd1302, %rd1298, %rd1301; | |
ld.global.u32 %r2792, [%rd1302]; | |
and.b32 %r2793, %r2792, 65535; | |
shl.b32 %r2794, %r2793, 6; | |
bfe.u32 %r2795, %r2792, 16, 6; | |
or.b32 %r5857, %r2794, %r2795; | |
st.local.u32 [%rd1+652], %r5857; | |
setp.le.u32 %p162, %r967, %r5857; | |
mov.u32 %r5856, %r967; | |
@%p162 bra BB0_322; | |
st.local.u32 [%rd1+648], %r5857; | |
st.local.u32 [%rd1+652], %r967; | |
mov.u32 %r5541, %r5857; | |
mov.u32 %r5857, %r967; | |
mov.u32 %r5856, %r5541; | |
BB0_322: | |
mov.u32 %r970, %r5856; | |
mov.u32 %r969, %r5857; | |
setp.le.u32 %p163, %r5850, %r970; | |
mov.u32 %r5852, %r970; | |
mov.u32 %r5853, %r969; | |
@%p163 bra BB0_324; | |
st.local.u32 [%rd1+640], %r970; | |
st.local.u32 [%rd1+648], %r5850; | |
st.local.u32 [%rd1+644], %r969; | |
st.local.u32 [%rd1+652], %r5851; | |
mov.u32 %r5538, %r5851; | |
mov.u32 %r5540, %r5850; | |
mov.u32 %r5851, %r969; | |
mov.u32 %r5850, %r970; | |
mov.u32 %r5852, %r5540; | |
mov.u32 %r5853, %r5538; | |
BB0_324: | |
mov.u32 %r5842, %r5850; | |
mov.u32 %r5843, %r5851; | |
mov.u32 %r5844, %r5852; | |
mov.u32 %r5845, %r5853; | |
mul.lo.s64 %rd1303, %rd82, 1792; | |
add.s64 %rd1304, %rd3, %rd1303; | |
bfe.u32 %r2796, %r961, 22, 6; | |
mul.wide.u32 %rd1305, %r2796, 28; | |
add.s64 %rd1306, %rd1304, %rd1305; | |
ld.global.u32 %r975, [%rd1306+-8]; | |
and.b32 %r2797, %r975, 65535; | |
cvt.u64.u32 %rd84, %r2797; | |
bfe.u32 %r2798, %r975, 16, 6; | |
mul.wide.u32 %rd1307, %r2797, 1792; | |
add.s64 %rd1308, %rd136, %rd1307; | |
mul.wide.u32 %rd1309, %r2798, 28; | |
add.s64 %rd1310, %rd1308, %rd1309; | |
ld.global.u32 %r2799, [%rd1310]; | |
and.b32 %r2800, %r2799, 65535; | |
bfe.u32 %r2801, %r2799, 16, 6; | |
mul.wide.u32 %rd1311, %r2800, 1792; | |
add.s64 %rd1312, %rd135, %rd1311; | |
mul.wide.u32 %rd1313, %r2801, 28; | |
add.s64 %rd1314, %rd1312, %rd1313; | |
ld.global.u32 %r2802, [%rd1314]; | |
and.b32 %r2803, %r2802, 65535; | |
shl.b32 %r2804, %r2803, 6; | |
bfe.u32 %r2805, %r2802, 16, 6; | |
or.b32 %r976, %r2804, %r2805; | |
st.local.u32 [%rd1+656], %r976; | |
bfe.u32 %r2806, %r2799, 22, 6; | |
mul.wide.u32 %rd1315, %r2806, 28; | |
add.s64 %rd1316, %rd1312, %rd1315; | |
ld.global.u32 %r2807, [%rd1316]; | |
and.b32 %r2808, %r2807, 65535; | |
shl.b32 %r2809, %r2808, 6; | |
bfe.u32 %r2810, %r2807, 16, 6; | |
or.b32 %r5863, %r2809, %r2810; | |
st.local.u32 [%rd1+660], %r5863; | |
setp.le.u32 %p164, %r976, %r5863; | |
mov.u32 %r5862, %r976; | |
@%p164 bra BB0_326; | |
st.local.u32 [%rd1+656], %r5863; | |
st.local.u32 [%rd1+660], %r976; | |
mov.u32 %r5555, %r5863; | |
mov.u32 %r5863, %r976; | |
mov.u32 %r5862, %r5555; | |
BB0_326: | |
mov.u32 %r5858, %r5862; | |
mov.u32 %r5859, %r5863; | |
bfe.u32 %r2811, %r975, 22, 6; | |
mul.lo.s64 %rd1317, %rd84, 1792; | |
add.s64 %rd1318, %rd136, %rd1317; | |
mul.wide.u32 %rd1319, %r2811, 28; | |
add.s64 %rd1320, %rd1318, %rd1319; | |
ld.global.u32 %r2812, [%rd1320]; | |
and.b32 %r2813, %r2812, 65535; | |
bfe.u32 %r2814, %r2812, 16, 6; | |
mul.wide.u32 %rd1321, %r2813, 1792; | |
add.s64 %rd1322, %rd135, %rd1321; | |
mul.wide.u32 %rd1323, %r2814, 28; | |
add.s64 %rd1324, %rd1322, %rd1323; | |
ld.global.u32 %r2815, [%rd1324]; | |
and.b32 %r2816, %r2815, 65535; | |
shl.b32 %r2817, %r2816, 6; | |
bfe.u32 %r2818, %r2815, 16, 6; | |
or.b32 %r980, %r2817, %r2818; | |
st.local.u32 [%rd1+664], %r980; | |
bfe.u32 %r2819, %r2812, 22, 6; | |
mul.wide.u32 %rd1325, %r2819, 28; | |
add.s64 %rd1326, %rd1322, %rd1325; | |
ld.global.u32 %r2820, [%rd1326]; | |
and.b32 %r2821, %r2820, 65535; | |
shl.b32 %r2822, %r2821, 6; | |
bfe.u32 %r2823, %r2820, 16, 6; | |
or.b32 %r5865, %r2822, %r2823; | |
st.local.u32 [%rd1+668], %r5865; | |
setp.le.u32 %p165, %r980, %r5865; | |
mov.u32 %r5864, %r980; | |
@%p165 bra BB0_328; | |
st.local.u32 [%rd1+664], %r5865; | |
st.local.u32 [%rd1+668], %r980; | |
mov.u32 %r5561, %r5865; | |
mov.u32 %r5865, %r980; | |
mov.u32 %r5864, %r5561; | |
BB0_328: | |
mov.u32 %r983, %r5864; | |
mov.u32 %r982, %r5865; | |
setp.le.u32 %p166, %r5858, %r983; | |
mov.u32 %r5860, %r983; | |
mov.u32 %r5861, %r982; | |
@%p166 bra BB0_330; | |
st.local.u32 [%rd1+656], %r983; | |
st.local.u32 [%rd1+664], %r5858; | |
st.local.u32 [%rd1+660], %r982; | |
st.local.u32 [%rd1+668], %r5859; | |
mov.u32 %r5558, %r5859; | |
mov.u32 %r5560, %r5858; | |
mov.u32 %r5859, %r982; | |
mov.u32 %r5858, %r983; | |
mov.u32 %r5860, %r5560; | |
mov.u32 %r5861, %r5558; | |
BB0_330: | |
mov.u32 %r987, %r5858; | |
mov.u32 %r986, %r5859; | |
mov.u32 %r985, %r5860; | |
mov.u32 %r984, %r5861; | |
setp.le.u32 %p167, %r5842, %r987; | |
mov.u32 %r5846, %r987; | |
mov.u32 %r5847, %r986; | |
mov.u32 %r5848, %r985; | |
mov.u32 %r5849, %r984; | |
@%p167 bra BB0_332; | |
st.local.u32 [%rd1+640], %r987; | |
st.local.u32 [%rd1+656], %r5842; | |
st.local.u32 [%rd1+644], %r986; | |
st.local.u32 [%rd1+660], %r5843; | |
st.local.u32 [%rd1+648], %r985; | |
st.local.u32 [%rd1+664], %r5844; | |
st.local.u32 [%rd1+652], %r984; | |
st.local.u32 [%rd1+668], %r5845; | |
mov.u32 %r5548, %r5845; | |
mov.u32 %r5550, %r5844; | |
mov.u32 %r5552, %r5843; | |
mov.u32 %r5554, %r5842; | |
mov.u32 %r5845, %r984; | |
mov.u32 %r5844, %r985; | |
mov.u32 %r5843, %r986; | |
mov.u32 %r5842, %r987; | |
mov.u32 %r5846, %r5554; | |
mov.u32 %r5847, %r5552; | |
mov.u32 %r5848, %r5550; | |
mov.u32 %r5849, %r5548; | |
BB0_332: | |
mov.u32 %r5826, %r5842; | |
mov.u32 %r5827, %r5843; | |
mov.u32 %r5828, %r5844; | |
mov.u32 %r5829, %r5845; | |
mov.u32 %r5830, %r5846; | |
mov.u32 %r5831, %r5847; | |
mov.u32 %r5832, %r5848; | |
mov.u32 %r5833, %r5849; | |
mul.lo.s64 %rd1327, %rd81, 1792; | |
add.s64 %rd1328, %rd136, %rd1327; | |
bfe.u32 %r2824, %r960, 22, 6; | |
mul.wide.u32 %rd1329, %r2824, 28; | |
add.s64 %rd1330, %rd1328, %rd1329; | |
ld.global.u32 %r996, [%rd1330+4]; | |
and.b32 %r2825, %r996, 65535; | |
mul.wide.u32 %rd1331, %r2825, 1792; | |
add.s64 %rd1332, %rd3, %rd1331; | |
cvt.u64.u32 %rd85, %r2825; | |
bfe.u32 %r2826, %r996, 16, 6; | |
mul.wide.u32 %rd1333, %r2826, 28; | |
add.s64 %rd1334, %rd1332, %rd1333; | |
ld.global.u32 %r997, [%rd1334+-8]; | |
and.b32 %r2827, %r997, 65535; | |
cvt.u64.u32 %rd86, %r2827; | |
bfe.u32 %r2828, %r997, 16, 6; | |
mul.wide.u32 %rd1335, %r2827, 1792; | |
add.s64 %rd1336, %rd136, %rd1335; | |
mul.wide.u32 %rd1337, %r2828, 28; | |
add.s64 %rd1338, %rd1336, %rd1337; | |
ld.global.u32 %r2829, [%rd1338]; | |
and.b32 %r2830, %r2829, 65535; | |
bfe.u32 %r2831, %r2829, 16, 6; | |
mul.wide.u32 %rd1339, %r2830, 1792; | |
add.s64 %rd1340, %rd135, %rd1339; | |
mul.wide.u32 %rd1341, %r2831, 28; | |
add.s64 %rd1342, %rd1340, %rd1341; | |
ld.global.u32 %r2832, [%rd1342]; | |
and.b32 %r2833, %r2832, 65535; | |
shl.b32 %r2834, %r2833, 6; | |
bfe.u32 %r2835, %r2832, 16, 6; | |
or.b32 %r998, %r2834, %r2835; | |
st.local.u32 [%rd1+672], %r998; | |
bfe.u32 %r2836, %r2829, 22, 6; | |
mul.wide.u32 %rd1343, %r2836, 28; | |
add.s64 %rd1344, %rd1340, %rd1343; | |
ld.global.u32 %r2837, [%rd1344]; | |
and.b32 %r2838, %r2837, 65535; | |
shl.b32 %r2839, %r2838, 6; | |
bfe.u32 %r2840, %r2837, 16, 6; | |
or.b32 %r5879, %r2839, %r2840; | |
st.local.u32 [%rd1+676], %r5879; | |
setp.le.u32 %p168, %r998, %r5879; | |
mov.u32 %r5878, %r998; | |
@%p168 bra BB0_334; | |
st.local.u32 [%rd1+672], %r5879; | |
st.local.u32 [%rd1+676], %r998; | |
mov.u32 %r5591, %r5879; | |
mov.u32 %r5879, %r998; | |
mov.u32 %r5878, %r5591; | |
BB0_334: | |
mov.u32 %r5874, %r5878; | |
mov.u32 %r5875, %r5879; | |
bfe.u32 %r2841, %r997, 22, 6; | |
mul.lo.s64 %rd1345, %rd86, 1792; | |
add.s64 %rd1346, %rd136, %rd1345; | |
mul.wide.u32 %rd1347, %r2841, 28; | |
add.s64 %rd1348, %rd1346, %rd1347; | |
ld.global.u32 %r2842, [%rd1348]; | |
and.b32 %r2843, %r2842, 65535; | |
bfe.u32 %r2844, %r2842, 16, 6; | |
mul.wide.u32 %rd1349, %r2843, 1792; | |
add.s64 %rd1350, %rd135, %rd1349; | |
mul.wide.u32 %rd1351, %r2844, 28; | |
add.s64 %rd1352, %rd1350, %rd1351; | |
ld.global.u32 %r2845, [%rd1352]; | |
and.b32 %r2846, %r2845, 65535; | |
shl.b32 %r2847, %r2846, 6; | |
bfe.u32 %r2848, %r2845, 16, 6; | |
or.b32 %r1002, %r2847, %r2848; | |
st.local.u32 [%rd1+680], %r1002; | |
bfe.u32 %r2849, %r2842, 22, 6; | |
mul.wide.u32 %rd1353, %r2849, 28; | |
add.s64 %rd1354, %rd1350, %rd1353; | |
ld.global.u32 %r2850, [%rd1354]; | |
and.b32 %r2851, %r2850, 65535; | |
shl.b32 %r2852, %r2851, 6; | |
bfe.u32 %r2853, %r2850, 16, 6; | |
or.b32 %r5881, %r2852, %r2853; | |
st.local.u32 [%rd1+684], %r5881; | |
setp.le.u32 %p169, %r1002, %r5881; | |
mov.u32 %r5880, %r1002; | |
@%p169 bra BB0_336; | |
st.local.u32 [%rd1+680], %r5881; | |
st.local.u32 [%rd1+684], %r1002; | |
mov.u32 %r5597, %r5881; | |
mov.u32 %r5881, %r1002; | |
mov.u32 %r5880, %r5597; | |
BB0_336: | |
mov.u32 %r1005, %r5880; | |
mov.u32 %r1004, %r5881; | |
setp.le.u32 %p170, %r5874, %r1005; | |
mov.u32 %r5876, %r1005; | |
mov.u32 %r5877, %r1004; | |
@%p170 bra BB0_338; | |
st.local.u32 [%rd1+672], %r1005; | |
st.local.u32 [%rd1+680], %r5874; | |
st.local.u32 [%rd1+676], %r1004; | |
st.local.u32 [%rd1+684], %r5875; | |
mov.u32 %r5594, %r5875; | |
mov.u32 %r5596, %r5874; | |
mov.u32 %r5875, %r1004; | |
mov.u32 %r5874, %r1005; | |
mov.u32 %r5876, %r5596; | |
mov.u32 %r5877, %r5594; | |
BB0_338: | |
mov.u32 %r5866, %r5874; | |
mov.u32 %r5867, %r5875; | |
mov.u32 %r5868, %r5876; | |
mov.u32 %r5869, %r5877; | |
mul.lo.s64 %rd1355, %rd85, 1792; | |
add.s64 %rd1356, %rd3, %rd1355; | |
bfe.u32 %r2854, %r996, 22, 6; | |
mul.wide.u32 %rd1357, %r2854, 28; | |
add.s64 %rd1358, %rd1356, %rd1357; | |
ld.global.u32 %r1010, [%rd1358+-8]; | |
and.b32 %r2855, %r1010, 65535; | |
cvt.u64.u32 %rd87, %r2855; | |
bfe.u32 %r2856, %r1010, 16, 6; | |
mul.wide.u32 %rd1359, %r2855, 1792; | |
add.s64 %rd1360, %rd136, %rd1359; | |
mul.wide.u32 %rd1361, %r2856, 28; | |
add.s64 %rd1362, %rd1360, %rd1361; | |
ld.global.u32 %r2857, [%rd1362]; | |
and.b32 %r2858, %r2857, 65535; | |
bfe.u32 %r2859, %r2857, 16, 6; | |
mul.wide.u32 %rd1363, %r2858, 1792; | |
add.s64 %rd1364, %rd135, %rd1363; | |
mul.wide.u32 %rd1365, %r2859, 28; | |
add.s64 %rd1366, %rd1364, %rd1365; | |
ld.global.u32 %r2860, [%rd1366]; | |
and.b32 %r2861, %r2860, 65535; | |
shl.b32 %r2862, %r2861, 6; | |
bfe.u32 %r2863, %r2860, 16, 6; | |
or.b32 %r1011, %r2862, %r2863; | |
st.local.u32 [%rd1+688], %r1011; | |
bfe.u32 %r2864, %r2857, 22, 6; | |
mul.wide.u32 %rd1367, %r2864, 28; | |
add.s64 %rd1368, %rd1364, %rd1367; | |
ld.global.u32 %r2865, [%rd1368]; | |
and.b32 %r2866, %r2865, 65535; | |
shl.b32 %r2867, %r2866, 6; | |
bfe.u32 %r2868, %r2865, 16, 6; | |
or.b32 %r5887, %r2867, %r2868; | |
st.local.u32 [%rd1+692], %r5887; | |
setp.le.u32 %p171, %r1011, %r5887; | |
mov.u32 %r5886, %r1011; | |
@%p171 bra BB0_340; | |
st.local.u32 [%rd1+688], %r5887; | |
st.local.u32 [%rd1+692], %r1011; | |
mov.u32 %r5611, %r5887; | |
mov.u32 %r5887, %r1011; | |
mov.u32 %r5886, %r5611; | |
BB0_340: | |
mov.u32 %r5882, %r5886; | |
mov.u32 %r5883, %r5887; | |
bfe.u32 %r2869, %r1010, 22, 6; | |
mul.lo.s64 %rd1369, %rd87, 1792; | |
add.s64 %rd1370, %rd136, %rd1369; | |
mul.wide.u32 %rd1371, %r2869, 28; | |
add.s64 %rd1372, %rd1370, %rd1371; | |
ld.global.u32 %r2870, [%rd1372]; | |
and.b32 %r2871, %r2870, 65535; | |
bfe.u32 %r2872, %r2870, 16, 6; | |
mul.wide.u32 %rd1373, %r2871, 1792; | |
add.s64 %rd1374, %rd135, %rd1373; | |
mul.wide.u32 %rd1375, %r2872, 28; | |
add.s64 %rd1376, %rd1374, %rd1375; | |
ld.global.u32 %r2873, [%rd1376]; | |
and.b32 %r2874, %r2873, 65535; | |
shl.b32 %r2875, %r2874, 6; | |
bfe.u32 %r2876, %r2873, 16, 6; | |
or.b32 %r1015, %r2875, %r2876; | |
st.local.u32 [%rd1+696], %r1015; | |
bfe.u32 %r2877, %r2870, 22, 6; | |
mul.wide.u32 %rd1377, %r2877, 28; | |
add.s64 %rd1378, %rd1374, %rd1377; | |
ld.global.u32 %r2878, [%rd1378]; | |
and.b32 %r2879, %r2878, 65535; | |
shl.b32 %r2880, %r2879, 6; | |
bfe.u32 %r2881, %r2878, 16, 6; | |
or.b32 %r5889, %r2880, %r2881; | |
st.local.u32 [%rd1+700], %r5889; | |
setp.le.u32 %p172, %r1015, %r5889; | |
mov.u32 %r5888, %r1015; | |
@%p172 bra BB0_342; | |
st.local.u32 [%rd1+696], %r5889; | |
st.local.u32 [%rd1+700], %r1015; | |
mov.u32 %r5617, %r5889; | |
mov.u32 %r5889, %r1015; | |
mov.u32 %r5888, %r5617; | |
BB0_342: | |
mov.u32 %r1018, %r5888; | |
mov.u32 %r1017, %r5889; | |
setp.le.u32 %p173, %r5882, %r1018; | |
mov.u32 %r5884, %r1018; | |
mov.u32 %r5885, %r1017; | |
@%p173 bra BB0_344; | |
st.local.u32 [%rd1+688], %r1018; | |
st.local.u32 [%rd1+696], %r5882; | |
st.local.u32 [%rd1+692], %r1017; | |
st.local.u32 [%rd1+700], %r5883; | |
mov.u32 %r5614, %r5883; | |
mov.u32 %r5616, %r5882; | |
mov.u32 %r5883, %r1017; | |
mov.u32 %r5882, %r1018; | |
mov.u32 %r5884, %r5616; | |
mov.u32 %r5885, %r5614; | |
BB0_344: | |
mov.u32 %r1022, %r5882; | |
mov.u32 %r1021, %r5883; | |
mov.u32 %r1020, %r5884; | |
mov.u32 %r1019, %r5885; | |
setp.le.u32 %p174, %r5866, %r1022; | |
mov.u32 %r5870, %r1022; | |
mov.u32 %r5871, %r1021; | |
mov.u32 %r5872, %r1020; | |
mov.u32 %r5873, %r1019; | |
@%p174 bra BB0_346; | |
st.local.u32 [%rd1+672], %r1022; | |
st.local.u32 [%rd1+688], %r5866; | |
st.local.u32 [%rd1+676], %r1021; | |
st.local.u32 [%rd1+692], %r5867; | |
st.local.u32 [%rd1+680], %r1020; | |
st.local.u32 [%rd1+696], %r5868; | |
st.local.u32 [%rd1+684], %r1019; | |
st.local.u32 [%rd1+700], %r5869; | |
mov.u32 %r5604, %r5869; | |
mov.u32 %r5606, %r5868; | |
mov.u32 %r5608, %r5867; | |
mov.u32 %r5610, %r5866; | |
mov.u32 %r5869, %r1019; | |
mov.u32 %r5868, %r1020; | |
mov.u32 %r5867, %r1021; | |
mov.u32 %r5866, %r1022; | |
mov.u32 %r5870, %r5610; | |
mov.u32 %r5871, %r5608; | |
mov.u32 %r5872, %r5606; | |
mov.u32 %r5873, %r5604; | |
BB0_346: | |
mov.u32 %r1030, %r5866; | |
mov.u32 %r1029, %r5867; | |
mov.u32 %r1028, %r5868; | |
mov.u32 %r1027, %r5869; | |
mov.u32 %r1026, %r5870; | |
mov.u32 %r1025, %r5871; | |
mov.u32 %r1024, %r5872; | |
mov.u32 %r1023, %r5873; | |
setp.le.u32 %p175, %r5826, %r1030; | |
mov.u32 %r5834, %r1030; | |
mov.u32 %r5835, %r1029; | |
mov.u32 %r5836, %r1028; | |
mov.u32 %r5837, %r1027; | |
mov.u32 %r5838, %r1026; | |
mov.u32 %r5839, %r1025; | |
mov.u32 %r5840, %r1024; | |
mov.u32 %r5841, %r1023; | |
@%p175 bra BB0_348; | |
st.local.u32 [%rd1+640], %r1030; | |
st.local.u32 [%rd1+672], %r5826; | |
st.local.u32 [%rd1+644], %r1029; | |
st.local.u32 [%rd1+676], %r5827; | |
st.local.u32 [%rd1+648], %r1028; | |
st.local.u32 [%rd1+680], %r5828; | |
st.local.u32 [%rd1+652], %r1027; | |
st.local.u32 [%rd1+684], %r5829; | |
st.local.u32 [%rd1+656], %r1026; | |
st.local.u32 [%rd1+688], %r5830; | |
st.local.u32 [%rd1+660], %r1025; | |
st.local.u32 [%rd1+692], %r5831; | |
st.local.u32 [%rd1+664], %r1024; | |
st.local.u32 [%rd1+696], %r5832; | |
st.local.u32 [%rd1+668], %r1023; | |
st.local.u32 [%rd1+700], %r5833; | |
mov.u32 %r5576, %r5833; | |
mov.u32 %r5578, %r5832; | |
mov.u32 %r5580, %r5831; | |
mov.u32 %r5582, %r5830; | |
mov.u32 %r5584, %r5829; | |
mov.u32 %r5586, %r5828; | |
mov.u32 %r5588, %r5827; | |
mov.u32 %r5590, %r5826; | |
mov.u32 %r5833, %r1023; | |
mov.u32 %r5832, %r1024; | |
mov.u32 %r5831, %r1025; | |
mov.u32 %r5830, %r1026; | |
mov.u32 %r5829, %r1027; | |
mov.u32 %r5828, %r1028; | |
mov.u32 %r5827, %r1029; | |
mov.u32 %r5826, %r1030; | |
mov.u32 %r5834, %r5590; | |
mov.u32 %r5835, %r5588; | |
mov.u32 %r5836, %r5586; | |
mov.u32 %r5837, %r5584; | |
mov.u32 %r5838, %r5582; | |
mov.u32 %r5839, %r5580; | |
mov.u32 %r5840, %r5578; | |
mov.u32 %r5841, %r5576; | |
BB0_348: | |
mov.u32 %r1046, %r5826; | |
mul.lo.s64 %rd1379, %rd80, 1792; | |
add.s64 %rd1380, %rd3, %rd1379; | |
bfe.u32 %r2882, %r959, 22, 6; | |
mul.wide.u32 %rd1381, %r2882, 28; | |
add.s64 %rd1382, %rd1380, %rd1381; | |
ld.global.u32 %r1047, [%rd1382+-4]; | |
and.b32 %r2883, %r1047, 65535; | |
mul.wide.u32 %rd1383, %r2883, 1792; | |
add.s64 %rd1384, %rd136, %rd1383; | |
bfe.u32 %r2884, %r1047, 16, 6; | |
mul.wide.u32 %rd1385, %r2884, 28; | |
add.s64 %rd1386, %rd1384, %rd1385; | |
ld.global.u32 %r1048, [%rd1386+4]; | |
and.b32 %r2885, %r1048, 65535; | |
mul.wide.u32 %rd1387, %r2885, 1792; | |
add.s64 %rd1388, %rd3, %rd1387; | |
cvt.u64.u32 %rd88, %r2883; | |
cvt.u64.u32 %rd89, %r2885; | |
bfe.u32 %r2886, %r1048, 16, 6; | |
mul.wide.u32 %rd1389, %r2886, 28; | |
add.s64 %rd1390, %rd1388, %rd1389; | |
ld.global.u32 %r1049, [%rd1390+-8]; | |
and.b32 %r2887, %r1049, 65535; | |
cvt.u64.u32 %rd90, %r2887; | |
bfe.u32 %r2888, %r1049, 16, 6; | |
mul.wide.u32 %rd1391, %r2887, 1792; | |
add.s64 %rd1392, %rd136, %rd1391; | |
mul.wide.u32 %rd1393, %r2888, 28; | |
add.s64 %rd1394, %rd1392, %rd1393; | |
ld.global.u32 %r2889, [%rd1394]; | |
and.b32 %r2890, %r2889, 65535; | |
bfe.u32 %r2891, %r2889, 16, 6; | |
mul.wide.u32 %rd1395, %r2890, 1792; | |
add.s64 %rd1396, %rd135, %rd1395; | |
mul.wide.u32 %rd1397, %r2891, 28; | |
add.s64 %rd1398, %rd1396, %rd1397; | |
ld.global.u32 %r2892, [%rd1398]; | |
and.b32 %r2893, %r2892, 65535; | |
shl.b32 %r2894, %r2893, 6; | |
bfe.u32 %r2895, %r2892, 16, 6; | |
or.b32 %r1050, %r2894, %r2895; | |
st.local.u32 [%rd1+704], %r1050; | |
bfe.u32 %r2896, %r2889, 22, 6; | |
mul.wide.u32 %rd1399, %r2896, 28; | |
add.s64 %rd1400, %rd1396, %rd1399; | |
ld.global.u32 %r2897, [%rd1400]; | |
and.b32 %r2898, %r2897, 65535; | |
shl.b32 %r2899, %r2898, 6; | |
bfe.u32 %r2900, %r2897, 16, 6; | |
or.b32 %r5791, %r2899, %r2900; | |
st.local.u32 [%rd1+708], %r5791; | |
setp.le.u32 %p176, %r1050, %r5791; | |
mov.u32 %r5790, %r1050; | |
@%p176 bra BB0_350; | |
st.local.u32 [%rd1+704], %r5791; | |
st.local.u32 [%rd1+708], %r1050; | |
mov.u32 %r5648, %r5791; | |
mov.u32 %r5791, %r1050; | |
mov.u32 %r5790, %r5648; | |
BB0_350: | |
mov.u32 %r5786, %r5790; | |
mov.u32 %r5787, %r5791; | |
bfe.u32 %r2901, %r1049, 22, 6; | |
mul.lo.s64 %rd1401, %rd90, 1792; | |
add.s64 %rd1402, %rd136, %rd1401; | |
mul.wide.u32 %rd1403, %r2901, 28; | |
add.s64 %rd1404, %rd1402, %rd1403; | |
ld.global.u32 %r2902, [%rd1404]; | |
and.b32 %r2903, %r2902, 65535; | |
bfe.u32 %r2904, %r2902, 16, 6; | |
mul.wide.u32 %rd1405, %r2903, 1792; | |
add.s64 %rd1406, %rd135, %rd1405; | |
mul.wide.u32 %rd1407, %r2904, 28; | |
add.s64 %rd1408, %rd1406, %rd1407; | |
ld.global.u32 %r2905, [%rd1408]; | |
and.b32 %r2906, %r2905, 65535; | |
shl.b32 %r2907, %r2906, 6; | |
bfe.u32 %r2908, %r2905, 16, 6; | |
or.b32 %r1054, %r2907, %r2908; | |
st.local.u32 [%rd1+712], %r1054; | |
bfe.u32 %r2909, %r2902, 22, 6; | |
mul.wide.u32 %rd1409, %r2909, 28; | |
add.s64 %rd1410, %rd1406, %rd1409; | |
ld.global.u32 %r2910, [%rd1410]; | |
and.b32 %r2911, %r2910, 65535; | |
shl.b32 %r2912, %r2911, 6; | |
bfe.u32 %r2913, %r2910, 16, 6; | |
or.b32 %r5793, %r2912, %r2913; | |
st.local.u32 [%rd1+716], %r5793; | |
setp.le.u32 %p177, %r1054, %r5793; | |
mov.u32 %r5792, %r1054; | |
@%p177 bra BB0_352; | |
st.local.u32 [%rd1+712], %r5793; | |
st.local.u32 [%rd1+716], %r1054; | |
mov.u32 %r5654, %r5793; | |
mov.u32 %r5793, %r1054; | |
mov.u32 %r5792, %r5654; | |
BB0_352: | |
mov.u32 %r1057, %r5792; | |
mov.u32 %r1056, %r5793; | |
setp.le.u32 %p178, %r5786, %r1057; | |
mov.u32 %r5788, %r1057; | |
mov.u32 %r5789, %r1056; | |
@%p178 bra BB0_354; | |
st.local.u32 [%rd1+704], %r1057; | |
st.local.u32 [%rd1+712], %r5786; | |
st.local.u32 [%rd1+708], %r1056; | |
st.local.u32 [%rd1+716], %r5787; | |
mov.u32 %r5651, %r5787; | |
mov.u32 %r5653, %r5786; | |
mov.u32 %r5787, %r1056; | |
mov.u32 %r5786, %r1057; | |
mov.u32 %r5788, %r5653; | |
mov.u32 %r5789, %r5651; | |
BB0_354: | |
mov.u32 %r5778, %r5786; | |
mov.u32 %r5779, %r5787; | |
mov.u32 %r5780, %r5788; | |
mov.u32 %r5781, %r5789; | |
mul.lo.s64 %rd1411, %rd89, 1792; | |
add.s64 %rd1412, %rd3, %rd1411; | |
bfe.u32 %r2914, %r1048, 22, 6; | |
mul.wide.u32 %rd1413, %r2914, 28; | |
add.s64 %rd1414, %rd1412, %rd1413; | |
ld.global.u32 %r1062, [%rd1414+-8]; | |
and.b32 %r2915, %r1062, 65535; | |
cvt.u64.u32 %rd91, %r2915; | |
bfe.u32 %r2916, %r1062, 16, 6; | |
mul.wide.u32 %rd1415, %r2915, 1792; | |
add.s64 %rd1416, %rd136, %rd1415; | |
mul.wide.u32 %rd1417, %r2916, 28; | |
add.s64 %rd1418, %rd1416, %rd1417; | |
ld.global.u32 %r2917, [%rd1418]; | |
and.b32 %r2918, %r2917, 65535; | |
bfe.u32 %r2919, %r2917, 16, 6; | |
mul.wide.u32 %rd1419, %r2918, 1792; | |
add.s64 %rd1420, %rd135, %rd1419; | |
mul.wide.u32 %rd1421, %r2919, 28; | |
add.s64 %rd1422, %rd1420, %rd1421; | |
ld.global.u32 %r2920, [%rd1422]; | |
and.b32 %r2921, %r2920, 65535; | |
shl.b32 %r2922, %r2921, 6; | |
bfe.u32 %r2923, %r2920, 16, 6; | |
or.b32 %r1063, %r2922, %r2923; | |
st.local.u32 [%rd1+720], %r1063; | |
bfe.u32 %r2924, %r2917, 22, 6; | |
mul.wide.u32 %rd1423, %r2924, 28; | |
add.s64 %rd1424, %rd1420, %rd1423; | |
ld.global.u32 %r2925, [%rd1424]; | |
and.b32 %r2926, %r2925, 65535; | |
shl.b32 %r2927, %r2926, 6; | |
bfe.u32 %r2928, %r2925, 16, 6; | |
or.b32 %r5799, %r2927, %r2928; | |
st.local.u32 [%rd1+724], %r5799; | |
setp.le.u32 %p179, %r1063, %r5799; | |
mov.u32 %r5798, %r1063; | |
@%p179 bra BB0_356; | |
st.local.u32 [%rd1+720], %r5799; | |
st.local.u32 [%rd1+724], %r1063; | |
mov.u32 %r5668, %r5799; | |
mov.u32 %r5799, %r1063; | |
mov.u32 %r5798, %r5668; | |
BB0_356: | |
mov.u32 %r5794, %r5798; | |
mov.u32 %r5795, %r5799; | |
bfe.u32 %r2929, %r1062, 22, 6; | |
mul.lo.s64 %rd1425, %rd91, 1792; | |
add.s64 %rd1426, %rd136, %rd1425; | |
mul.wide.u32 %rd1427, %r2929, 28; | |
add.s64 %rd1428, %rd1426, %rd1427; | |
ld.global.u32 %r2930, [%rd1428]; | |
and.b32 %r2931, %r2930, 65535; | |
bfe.u32 %r2932, %r2930, 16, 6; | |
mul.wide.u32 %rd1429, %r2931, 1792; | |
add.s64 %rd1430, %rd135, %rd1429; | |
mul.wide.u32 %rd1431, %r2932, 28; | |
add.s64 %rd1432, %rd1430, %rd1431; | |
ld.global.u32 %r2933, [%rd1432]; | |
and.b32 %r2934, %r2933, 65535; | |
shl.b32 %r2935, %r2934, 6; | |
bfe.u32 %r2936, %r2933, 16, 6; | |
or.b32 %r1067, %r2935, %r2936; | |
st.local.u32 [%rd1+728], %r1067; | |
bfe.u32 %r2937, %r2930, 22, 6; | |
mul.wide.u32 %rd1433, %r2937, 28; | |
add.s64 %rd1434, %rd1430, %rd1433; | |
ld.global.u32 %r2938, [%rd1434]; | |
and.b32 %r2939, %r2938, 65535; | |
shl.b32 %r2940, %r2939, 6; | |
bfe.u32 %r2941, %r2938, 16, 6; | |
or.b32 %r5801, %r2940, %r2941; | |
st.local.u32 [%rd1+732], %r5801; | |
setp.le.u32 %p180, %r1067, %r5801; | |
mov.u32 %r5800, %r1067; | |
@%p180 bra BB0_358; | |
st.local.u32 [%rd1+728], %r5801; | |
st.local.u32 [%rd1+732], %r1067; | |
mov.u32 %r5674, %r5801; | |
mov.u32 %r5801, %r1067; | |
mov.u32 %r5800, %r5674; | |
BB0_358: | |
mov.u32 %r1070, %r5800; | |
mov.u32 %r1069, %r5801; | |
setp.le.u32 %p181, %r5794, %r1070; | |
mov.u32 %r5796, %r1070; | |
mov.u32 %r5797, %r1069; | |
@%p181 bra BB0_360; | |
st.local.u32 [%rd1+720], %r1070; | |
st.local.u32 [%rd1+728], %r5794; | |
st.local.u32 [%rd1+724], %r1069; | |
st.local.u32 [%rd1+732], %r5795; | |
mov.u32 %r5671, %r5795; | |
mov.u32 %r5673, %r5794; | |
mov.u32 %r5795, %r1069; | |
mov.u32 %r5794, %r1070; | |
mov.u32 %r5796, %r5673; | |
mov.u32 %r5797, %r5671; | |
BB0_360: | |
mov.u32 %r1074, %r5794; | |
mov.u32 %r1073, %r5795; | |
mov.u32 %r1072, %r5796; | |
mov.u32 %r1071, %r5797; | |
setp.le.u32 %p182, %r5778, %r1074; | |
mov.u32 %r5782, %r1074; | |
mov.u32 %r5783, %r1073; | |
mov.u32 %r5784, %r1072; | |
mov.u32 %r5785, %r1071; | |
@%p182 bra BB0_362; | |
st.local.u32 [%rd1+704], %r1074; | |
st.local.u32 [%rd1+720], %r5778; | |
st.local.u32 [%rd1+708], %r1073; | |
st.local.u32 [%rd1+724], %r5779; | |
st.local.u32 [%rd1+712], %r1072; | |
st.local.u32 [%rd1+728], %r5780; | |
st.local.u32 [%rd1+716], %r1071; | |
st.local.u32 [%rd1+732], %r5781; | |
mov.u32 %r5661, %r5781; | |
mov.u32 %r5663, %r5780; | |
mov.u32 %r5665, %r5779; | |
mov.u32 %r5667, %r5778; | |
mov.u32 %r5781, %r1071; | |
mov.u32 %r5780, %r1072; | |
mov.u32 %r5779, %r1073; | |
mov.u32 %r5778, %r1074; | |
mov.u32 %r5782, %r5667; | |
mov.u32 %r5783, %r5665; | |
mov.u32 %r5784, %r5663; | |
mov.u32 %r5785, %r5661; | |
BB0_362: | |
mov.u32 %r5762, %r5778; | |
mov.u32 %r5763, %r5779; | |
mov.u32 %r5764, %r5780; | |
mov.u32 %r5765, %r5781; | |
mov.u32 %r5766, %r5782; | |
mov.u32 %r5767, %r5783; | |
mov.u32 %r5768, %r5784; | |
mov.u32 %r5769, %r5785; | |
mul.lo.s64 %rd1435, %rd88, 1792; | |
add.s64 %rd1436, %rd136, %rd1435; | |
bfe.u32 %r2942, %r1047, 22, 6; | |
mul.wide.u32 %rd1437, %r2942, 28; | |
add.s64 %rd1438, %rd1436, %rd1437; | |
ld.global.u32 %r1083, [%rd1438+4]; | |
and.b32 %r2943, %r1083, 65535; | |
mul.wide.u32 %rd1439, %r2943, 1792; | |
add.s64 %rd1440, %rd3, %rd1439; | |
cvt.u64.u32 %rd92, %r2943; | |
bfe.u32 %r2944, %r1083, 16, 6; | |
mul.wide.u32 %rd1441, %r2944, 28; | |
add.s64 %rd1442, %rd1440, %rd1441; | |
ld.global.u32 %r1084, [%rd1442+-8]; | |
and.b32 %r2945, %r1084, 65535; | |
cvt.u64.u32 %rd93, %r2945; | |
bfe.u32 %r2946, %r1084, 16, 6; | |
mul.wide.u32 %rd1443, %r2945, 1792; | |
add.s64 %rd1444, %rd136, %rd1443; | |
mul.wide.u32 %rd1445, %r2946, 28; | |
add.s64 %rd1446, %rd1444, %rd1445; | |
ld.global.u32 %r2947, [%rd1446]; | |
and.b32 %r2948, %r2947, 65535; | |
bfe.u32 %r2949, %r2947, 16, 6; | |
mul.wide.u32 %rd1447, %r2948, 1792; | |
add.s64 %rd1448, %rd135, %rd1447; | |
mul.wide.u32 %rd1449, %r2949, 28; | |
add.s64 %rd1450, %rd1448, %rd1449; | |
ld.global.u32 %r2950, [%rd1450]; | |
and.b32 %r2951, %r2950, 65535; | |
shl.b32 %r2952, %r2951, 6; | |
bfe.u32 %r2953, %r2950, 16, 6; | |
or.b32 %r1085, %r2952, %r2953; | |
st.local.u32 [%rd1+736], %r1085; | |
bfe.u32 %r2954, %r2947, 22, 6; | |
mul.wide.u32 %rd1451, %r2954, 28; | |
add.s64 %rd1452, %rd1448, %rd1451; | |
ld.global.u32 %r2955, [%rd1452]; | |
and.b32 %r2956, %r2955, 65535; | |
shl.b32 %r2957, %r2956, 6; | |
bfe.u32 %r2958, %r2955, 16, 6; | |
or.b32 %r5815, %r2957, %r2958; | |
st.local.u32 [%rd1+740], %r5815; | |
setp.le.u32 %p183, %r1085, %r5815; | |
mov.u32 %r5814, %r1085; | |
@%p183 bra BB0_364; | |
st.local.u32 [%rd1+736], %r5815; | |
st.local.u32 [%rd1+740], %r1085; | |
mov.u32 %r5704, %r5815; | |
mov.u32 %r5815, %r1085; | |
mov.u32 %r5814, %r5704; | |
BB0_364: | |
mov.u32 %r5810, %r5814; | |
mov.u32 %r5811, %r5815; | |
bfe.u32 %r2959, %r1084, 22, 6; | |
mul.lo.s64 %rd1453, %rd93, 1792; | |
add.s64 %rd1454, %rd136, %rd1453; | |
mul.wide.u32 %rd1455, %r2959, 28; | |
add.s64 %rd1456, %rd1454, %rd1455; | |
ld.global.u32 %r2960, [%rd1456]; | |
and.b32 %r2961, %r2960, 65535; | |
bfe.u32 %r2962, %r2960, 16, 6; | |
mul.wide.u32 %rd1457, %r2961, 1792; | |
add.s64 %rd1458, %rd135, %rd1457; | |
mul.wide.u32 %rd1459, %r2962, 28; | |
add.s64 %rd1460, %rd1458, %rd1459; | |
ld.global.u32 %r2963, [%rd1460]; | |
and.b32 %r2964, %r2963, 65535; | |
shl.b32 %r2965, %r2964, 6; | |
bfe.u32 %r2966, %r2963, 16, 6; | |
or.b32 %r1089, %r2965, %r2966; | |
st.local.u32 [%rd1+744], %r1089; | |
bfe.u32 %r2967, %r2960, 22, 6; | |
mul.wide.u32 %rd1461, %r2967, 28; | |
add.s64 %rd1462, %rd1458, %rd1461; | |
ld.global.u32 %r2968, [%rd1462]; | |
and.b32 %r2969, %r2968, 65535; | |
shl.b32 %r2970, %r2969, 6; | |
bfe.u32 %r2971, %r2968, 16, 6; | |
or.b32 %r5817, %r2970, %r2971; | |
st.local.u32 [%rd1+748], %r5817; | |
setp.le.u32 %p184, %r1089, %r5817; | |
mov.u32 %r5816, %r1089; | |
@%p184 bra BB0_366; | |
st.local.u32 [%rd1+744], %r5817; | |
st.local.u32 [%rd1+748], %r1089; | |
mov.u32 %r5710, %r5817; | |
mov.u32 %r5817, %r1089; | |
mov.u32 %r5816, %r5710; | |
BB0_366: | |
mov.u32 %r1092, %r5816; | |
mov.u32 %r1091, %r5817; | |
setp.le.u32 %p185, %r5810, %r1092; | |
mov.u32 %r5812, %r1092; | |
mov.u32 %r5813, %r1091; | |
@%p185 bra BB0_368; | |
st.local.u32 [%rd1+736], %r1092; | |
st.local.u32 [%rd1+744], %r5810; | |
st.local.u32 [%rd1+740], %r1091; | |
st.local.u32 [%rd1+748], %r5811; | |
mov.u32 %r5707, %r5811; | |
mov.u32 %r5709, %r5810; | |
mov.u32 %r5811, %r1091; | |
mov.u32 %r5810, %r1092; | |
mov.u32 %r5812, %r5709; | |
mov.u32 %r5813, %r5707; | |
BB0_368: | |
mov.u32 %r5802, %r5810; | |
mov.u32 %r5803, %r5811; | |
mov.u32 %r5804, %r5812; | |
mov.u32 %r5805, %r5813; | |
mul.lo.s64 %rd1463, %rd92, 1792; | |
add.s64 %rd1464, %rd3, %rd1463; | |
bfe.u32 %r2972, %r1083, 22, 6; | |
mul.wide.u32 %rd1465, %r2972, 28; | |
add.s64 %rd1466, %rd1464, %rd1465; | |
ld.global.u32 %r1097, [%rd1466+-8]; | |
and.b32 %r2973, %r1097, 65535; | |
cvt.u64.u32 %rd94, %r2973; | |
bfe.u32 %r2974, %r1097, 16, 6; | |
mul.wide.u32 %rd1467, %r2973, 1792; | |
add.s64 %rd1468, %rd136, %rd1467; | |
mul.wide.u32 %rd1469, %r2974, 28; | |
add.s64 %rd1470, %rd1468, %rd1469; | |
ld.global.u32 %r2975, [%rd1470]; | |
and.b32 %r2976, %r2975, 65535; | |
bfe.u32 %r2977, %r2975, 16, 6; | |
mul.wide.u32 %rd1471, %r2976, 1792; | |
add.s64 %rd1472, %rd135, %rd1471; | |
mul.wide.u32 %rd1473, %r2977, 28; | |
add.s64 %rd1474, %rd1472, %rd1473; | |
ld.global.u32 %r2978, [%rd1474]; | |
and.b32 %r2979, %r2978, 65535; | |
shl.b32 %r2980, %r2979, 6; | |
bfe.u32 %r2981, %r2978, 16, 6; | |
or.b32 %r1098, %r2980, %r2981; | |
st.local.u32 [%rd1+752], %r1098; | |
bfe.u32 %r2982, %r2975, 22, 6; | |
mul.wide.u32 %rd1475, %r2982, 28; | |
add.s64 %rd1476, %rd1472, %rd1475; | |
ld.global.u32 %r2983, [%rd1476]; | |
and.b32 %r2984, %r2983, 65535; | |
shl.b32 %r2985, %r2984, 6; | |
bfe.u32 %r2986, %r2983, 16, 6; | |
or.b32 %r5823, %r2985, %r2986; | |
st.local.u32 [%rd1+756], %r5823; | |
setp.le.u32 %p186, %r1098, %r5823; | |
mov.u32 %r5822, %r1098; | |
@%p186 bra BB0_370; | |
st.local.u32 [%rd1+752], %r5823; | |
st.local.u32 [%rd1+756], %r1098; | |
mov.u32 %r5724, %r5823; | |
mov.u32 %r5823, %r1098; | |
mov.u32 %r5822, %r5724; | |
BB0_370: | |
mov.u32 %r5818, %r5822; | |
mov.u32 %r5819, %r5823; | |
bfe.u32 %r2987, %r1097, 22, 6; | |
mul.lo.s64 %rd1477, %rd94, 1792; | |
add.s64 %rd1478, %rd136, %rd1477; | |
mul.wide.u32 %rd1479, %r2987, 28; | |
add.s64 %rd1480, %rd1478, %rd1479; | |
ld.global.u32 %r2988, [%rd1480]; | |
and.b32 %r2989, %r2988, 65535; | |
bfe.u32 %r2990, %r2988, 16, 6; | |
mul.wide.u32 %rd1481, %r2989, 1792; | |
add.s64 %rd1482, %rd135, %rd1481; | |
mul.wide.u32 %rd1483, %r2990, 28; | |
add.s64 %rd1484, %rd1482, %rd1483; | |
ld.global.u32 %r2991, [%rd1484]; | |
and.b32 %r2992, %r2991, 65535; | |
shl.b32 %r2993, %r2992, 6; | |
bfe.u32 %r2994, %r2991, 16, 6; | |
or.b32 %r1102, %r2993, %r2994; | |
st.local.u32 [%rd1+760], %r1102; | |
bfe.u32 %r2995, %r2988, 22, 6; | |
mul.wide.u32 %rd1485, %r2995, 28; | |
add.s64 %rd1486, %rd1482, %rd1485; | |
ld.global.u32 %r2996, [%rd1486]; | |
and.b32 %r2997, %r2996, 65535; | |
shl.b32 %r2998, %r2997, 6; | |
bfe.u32 %r2999, %r2996, 16, 6; | |
or.b32 %r5825, %r2998, %r2999; | |
st.local.u32 [%rd1+764], %r5825; | |
setp.le.u32 %p187, %r1102, %r5825; | |
mov.u32 %r5824, %r1102; | |
@%p187 bra BB0_372; | |
st.local.u32 [%rd1+760], %r5825; | |
st.local.u32 [%rd1+764], %r1102; | |
mov.u32 %r5730, %r5825; | |
mov.u32 %r5825, %r1102; | |
mov.u32 %r5824, %r5730; | |
BB0_372: | |
mov.u32 %r1105, %r5824; | |
mov.u32 %r1104, %r5825; | |
setp.le.u32 %p188, %r5818, %r1105; | |
mov.u32 %r5820, %r1105; | |
mov.u32 %r5821, %r1104; | |
@%p188 bra BB0_374; | |
st.local.u32 [%rd1+752], %r1105; | |
st.local.u32 [%rd1+760], %r5818; | |
st.local.u32 [%rd1+756], %r1104; | |
st.local.u32 [%rd1+764], %r5819; | |
mov.u32 %r5727, %r5819; | |
mov.u32 %r5729, %r5818; | |
mov.u32 %r5819, %r1104; | |
mov.u32 %r5818, %r1105; | |
mov.u32 %r5820, %r5729; | |
mov.u32 %r5821, %r5727; | |
BB0_374: | |
mov.u32 %r1109, %r5818; | |
mov.u32 %r1108, %r5819; | |
mov.u32 %r1107, %r5820; | |
mov.u32 %r1106, %r5821; | |
setp.le.u32 %p189, %r5802, %r1109; | |
mov.u32 %r5806, %r1109; | |
mov.u32 %r5807, %r1108; | |
mov.u32 %r5808, %r1107; | |
mov.u32 %r5809, %r1106; | |
@%p189 bra BB0_376; | |
st.local.u32 [%rd1+736], %r1109; | |
st.local.u32 [%rd1+752], %r5802; | |
st.local.u32 [%rd1+740], %r1108; | |
st.local.u32 [%rd1+756], %r5803; | |
st.local.u32 [%rd1+744], %r1107; | |
st.local.u32 [%rd1+760], %r5804; | |
st.local.u32 [%rd1+748], %r1106; | |
st.local.u32 [%rd1+764], %r5805; | |
mov.u32 %r5717, %r5805; | |
mov.u32 %r5719, %r5804; | |
mov.u32 %r5721, %r5803; | |
mov.u32 %r5723, %r5802; | |
mov.u32 %r5805, %r1106; | |
mov.u32 %r5804, %r1107; | |
mov.u32 %r5803, %r1108; | |
mov.u32 %r5802, %r1109; | |
mov.u32 %r5806, %r5723; | |
mov.u32 %r5807, %r5721; | |
mov.u32 %r5808, %r5719; | |
mov.u32 %r5809, %r5717; | |
BB0_376: | |
mov.u32 %r1117, %r5802; | |
mov.u32 %r1116, %r5803; | |
mov.u32 %r1115, %r5804; | |
mov.u32 %r1114, %r5805; | |
mov.u32 %r1113, %r5806; | |
mov.u32 %r1112, %r5807; | |
mov.u32 %r1111, %r5808; | |
mov.u32 %r1110, %r5809; | |
setp.le.u32 %p190, %r5762, %r1117; | |
mov.u32 %r5770, %r1117; | |
mov.u32 %r5771, %r1116; | |
mov.u32 %r5772, %r1115; | |
mov.u32 %r5773, %r1114; | |
mov.u32 %r5774, %r1113; | |
mov.u32 %r5775, %r1112; | |
mov.u32 %r5776, %r1111; | |
mov.u32 %r5777, %r1110; | |
@%p190 bra BB0_378; | |
st.local.u32 [%rd1+704], %r1117; | |
st.local.u32 [%rd1+736], %r5762; | |
st.local.u32 [%rd1+708], %r1116; | |
st.local.u32 [%rd1+740], %r5763; | |
st.local.u32 [%rd1+712], %r1115; | |
st.local.u32 [%rd1+744], %r5764; | |
st.local.u32 [%rd1+716], %r1114; | |
st.local.u32 [%rd1+748], %r5765; | |
st.local.u32 [%rd1+720], %r1113; | |
st.local.u32 [%rd1+752], %r5766; | |
st.local.u32 [%rd1+724], %r1112; | |
st.local.u32 [%rd1+756], %r5767; | |
st.local.u32 [%rd1+728], %r1111; | |
st.local.u32 [%rd1+760], %r5768; | |
st.local.u32 [%rd1+732], %r1110; | |
st.local.u32 [%rd1+764], %r5769; | |
mov.u32 %r5689, %r5769; | |
mov.u32 %r5691, %r5768; | |
mov.u32 %r5693, %r5767; | |
mov.u32 %r5695, %r5766; | |
mov.u32 %r5697, %r5765; | |
mov.u32 %r5699, %r5764; | |
mov.u32 %r5701, %r5763; | |
mov.u32 %r5703, %r5762; | |
mov.u32 %r5769, %r1110; | |
mov.u32 %r5768, %r1111; | |
mov.u32 %r5767, %r1112; | |
mov.u32 %r5766, %r1113; | |
mov.u32 %r5765, %r1114; | |
mov.u32 %r5764, %r1115; | |
mov.u32 %r5763, %r1116; | |
mov.u32 %r5762, %r1117; | |
mov.u32 %r5770, %r5703; | |
mov.u32 %r5771, %r5701; | |
mov.u32 %r5772, %r5699; | |
mov.u32 %r5773, %r5697; | |
mov.u32 %r5774, %r5695; | |
mov.u32 %r5775, %r5693; | |
mov.u32 %r5776, %r5691; | |
mov.u32 %r5777, %r5689; | |
BB0_378: | |
mov.u32 %r1133, %r5762; | |
setp.le.u32 %p191, %r1046, %r1133; | |
mov.u32 %r5761, %r1046; | |
@%p191 bra BB0_380; | |
st.local.u32 [%rd1+640], %r1133; | |
st.local.u32 [%rd1+704], %r1046; | |
st.local.u32 [%rd1+644], %r5763; | |
st.local.u32 [%rd1+708], %r5827; | |
st.local.u32 [%rd1+648], %r5764; | |
st.local.u32 [%rd1+712], %r5828; | |
st.local.u32 [%rd1+652], %r5765; | |
st.local.u32 [%rd1+716], %r5829; | |
st.local.u32 [%rd1+656], %r5766; | |
st.local.u32 [%rd1+720], %r5830; | |
st.local.u32 [%rd1+660], %r5767; | |
st.local.u32 [%rd1+724], %r5831; | |
st.local.u32 [%rd1+664], %r5768; | |
st.local.u32 [%rd1+728], %r5832; | |
st.local.u32 [%rd1+668], %r5769; | |
st.local.u32 [%rd1+732], %r5833; | |
st.local.u32 [%rd1+672], %r5770; | |
st.local.u32 [%rd1+736], %r5834; | |
st.local.u32 [%rd1+676], %r5771; | |
st.local.u32 [%rd1+740], %r5835; | |
st.local.u32 [%rd1+680], %r5772; | |
st.local.u32 [%rd1+744], %r5836; | |
st.local.u32 [%rd1+684], %r5773; | |
st.local.u32 [%rd1+748], %r5837; | |
st.local.u32 [%rd1+688], %r5774; | |
st.local.u32 [%rd1+752], %r5838; | |
st.local.u32 [%rd1+692], %r5775; | |
st.local.u32 [%rd1+756], %r5839; | |
st.local.u32 [%rd1+696], %r5776; | |
st.local.u32 [%rd1+760], %r5840; | |
st.local.u32 [%rd1+700], %r5777; | |
st.local.u32 [%rd1+764], %r5841; | |
mov.u32 %r5761, %r1133; | |
BB0_380: | |
mov.u32 %r5890, -32; | |
setp.le.u32 %p192, %r5406, %r5761; | |
@%p192 bra BB0_383; | |
mov.u64 %rd1940, %rd1; | |
BB0_382: | |
mov.u64 %rd95, %rd1940; | |
ld.local.u32 %r3001, [%rd95+512]; | |
ld.local.u32 %r3002, [%rd95+640]; | |
ld.local.u32 %r3003, [%rd95+516]; | |
ld.local.u32 %r3004, [%rd95+644]; | |
ld.local.u32 %r3005, [%rd95+520]; | |
ld.local.u32 %r3006, [%rd95+648]; | |
ld.local.u32 %r3007, [%rd95+524]; | |
ld.local.u32 %r3008, [%rd95+652]; | |
ld.local.u32 %r3009, [%rd95+528]; | |
ld.local.u32 %r3010, [%rd95+656]; | |
ld.local.u32 %r3011, [%rd95+532]; | |
ld.local.u32 %r3012, [%rd95+660]; | |
ld.local.u32 %r3013, [%rd95+536]; | |
ld.local.u32 %r3014, [%rd95+664]; | |
ld.local.u32 %r3015, [%rd95+540]; | |
ld.local.u32 %r3016, [%rd95+668]; | |
st.local.u32 [%rd95+512], %r3002; | |
st.local.u32 [%rd95+640], %r3001; | |
st.local.u32 [%rd95+516], %r3004; | |
st.local.u32 [%rd95+644], %r3003; | |
st.local.u32 [%rd95+520], %r3006; | |
st.local.u32 [%rd95+648], %r3005; | |
st.local.u32 [%rd95+524], %r3008; | |
st.local.u32 [%rd95+652], %r3007; | |
st.local.u32 [%rd95+528], %r3010; | |
st.local.u32 [%rd95+656], %r3009; | |
st.local.u32 [%rd95+532], %r3012; | |
st.local.u32 [%rd95+660], %r3011; | |
st.local.u32 [%rd95+536], %r3014; | |
st.local.u32 [%rd95+664], %r3013; | |
st.local.u32 [%rd95+540], %r3016; | |
st.local.u32 [%rd95+668], %r3015; | |
add.s64 %rd96, %rd95, 32; | |
add.s32 %r5890, %r5890, 8; | |
setp.ne.s32 %p193, %r5890, 0; | |
mov.u64 %rd1940, %rd96; | |
@%p193 bra BB0_382; | |
BB0_383: | |
bfe.u32 %r3017, %r781, 22, 6; | |
mul.lo.s64 %rd1488, %rd63, 1792; | |
add.s64 %rd1489, %rd3, %rd1488; | |
mul.wide.u32 %rd1490, %r3017, 28; | |
add.s64 %rd1491, %rd1489, %rd1490; | |
ld.global.u32 %r1137, [%rd1491]; | |
and.b32 %r3018, %r1137, 65535; | |
mul.wide.u32 %rd1492, %r3018, 1792; | |
add.s64 %rd1493, %rd146, %rd1492; | |
bfe.u32 %r3019, %r1137, 16, 6; | |
mul.wide.u32 %rd1494, %r3019, 28; | |
add.s64 %rd1495, %rd1493, %rd1494; | |
ld.global.u32 %r1138, [%rd1495+4]; | |
and.b32 %r3020, %r1138, 65535; | |
mul.wide.u32 %rd1496, %r3020, 1792; | |
add.s64 %rd1497, %rd3, %rd1496; | |
bfe.u32 %r3021, %r1138, 16, 6; | |
mul.wide.u32 %rd1498, %r3021, 28; | |
add.s64 %rd1499, %rd1497, %rd1498; | |
ld.global.u32 %r1139, [%rd1499+-4]; | |
and.b32 %r3022, %r1139, 65535; | |
bfe.u32 %r3023, %r1139, 16, 6; | |
mul.wide.u32 %rd1500, %r3022, 1792; | |
add.s64 %rd1501, %rd146, %rd1500; | |
mul.wide.u32 %rd1502, %r3023, 28; | |
add.s64 %rd1503, %rd1501, %rd1502; | |
ld.global.u32 %r1140, [%rd1503]; | |
and.b32 %r3024, %r1140, 65535; | |
mul.wide.u32 %rd1504, %r3024, 1792; | |
add.s64 %rd1505, %rd3, %rd1504; | |
cvt.u64.u32 %rd97, %r3018; | |
cvt.u64.u32 %rd98, %r3020; | |
cvt.u64.u32 %rd99, %r3022; | |
cvt.u64.u32 %rd100, %r3024; | |
bfe.u32 %r3025, %r1140, 16, 6; | |
mul.wide.u32 %rd1506, %r3025, 28; | |
add.s64 %rd1507, %rd1505, %rd1506; | |
ld.global.u32 %r1141, [%rd1507+-8]; | |
and.b32 %r3026, %r1141, 65535; | |
cvt.u64.u32 %rd101, %r3026; | |
bfe.u32 %r3027, %r1141, 16, 6; | |
mul.wide.u32 %rd1508, %r3026, 1792; | |
add.s64 %rd1509, %rd136, %rd1508; | |
mul.wide.u32 %rd1510, %r3027, 28; | |
add.s64 %rd1511, %rd1509, %rd1510; | |
ld.global.u32 %r3028, [%rd1511]; | |
and.b32 %r3029, %r3028, 65535; | |
bfe.u32 %r3030, %r3028, 16, 6; | |
mul.wide.u32 %rd1512, %r3029, 1792; | |
add.s64 %rd1513, %rd135, %rd1512; | |
mul.wide.u32 %rd1514, %r3030, 28; | |
add.s64 %rd1515, %rd1513, %rd1514; | |
ld.global.u32 %r3031, [%rd1515]; | |
and.b32 %r3032, %r3031, 65535; | |
shl.b32 %r3033, %r3032, 6; | |
bfe.u32 %r3034, %r3031, 16, 6; | |
or.b32 %r1142, %r3033, %r3034; | |
st.local.u32 [%rd1+768], %r1142; | |
bfe.u32 %r3035, %r3028, 22, 6; | |
mul.wide.u32 %rd1516, %r3035, 28; | |
add.s64 %rd1517, %rd1513, %rd1516; | |
ld.global.u32 %r3036, [%rd1517]; | |
and.b32 %r3037, %r3036, 65535; | |
shl.b32 %r3038, %r3037, 6; | |
bfe.u32 %r3039, %r3036, 16, 6; | |
or.b32 %r6569, %r3038, %r3039; | |
st.local.u32 [%rd1+772], %r6569; | |
setp.le.u32 %p194, %r1142, %r6569; | |
mov.u32 %r6568, %r1142; | |
@%p194 bra BB0_385; | |
st.local.u32 [%rd1+768], %r6569; | |
st.local.u32 [%rd1+772], %r1142; | |
mov.u32 %r6247, %r6569; | |
mov.u32 %r6569, %r1142; | |
mov.u32 %r6568, %r6247; | |
BB0_385: | |
mov.u32 %r6564, %r6568; | |
mov.u32 %r6565, %r6569; | |
bfe.u32 %r3040, %r1141, 22, 6; | |
mul.lo.s64 %rd1518, %rd101, 1792; | |
add.s64 %rd1519, %rd136, %rd1518; | |
mul.wide.u32 %rd1520, %r3040, 28; | |
add.s64 %rd1521, %rd1519, %rd1520; | |
ld.global.u32 %r3041, [%rd1521]; | |
and.b32 %r3042, %r3041, 65535; | |
bfe.u32 %r3043, %r3041, 16, 6; | |
mul.wide.u32 %rd1522, %r3042, 1792; | |
add.s64 %rd1523, %rd135, %rd1522; | |
mul.wide.u32 %rd1524, %r3043, 28; | |
add.s64 %rd1525, %rd1523, %rd1524; | |
ld.global.u32 %r3044, [%rd1525]; | |
and.b32 %r3045, %r3044, 65535; | |
shl.b32 %r3046, %r3045, 6; | |
bfe.u32 %r3047, %r3044, 16, 6; | |
or.b32 %r1146, %r3046, %r3047; | |
st.local.u32 [%rd1+776], %r1146; | |
bfe.u32 %r3048, %r3041, 22, 6; | |
mul.wide.u32 %rd1526, %r3048, 28; | |
add.s64 %rd1527, %rd1523, %rd1526; | |
ld.global.u32 %r3049, [%rd1527]; | |
and.b32 %r3050, %r3049, 65535; | |
shl.b32 %r3051, %r3050, 6; | |
bfe.u32 %r3052, %r3049, 16, 6; | |
or.b32 %r6571, %r3051, %r3052; | |
st.local.u32 [%rd1+780], %r6571; | |
setp.le.u32 %p195, %r1146, %r6571; | |
mov.u32 %r6570, %r1146; | |
@%p195 bra BB0_387; | |
st.local.u32 [%rd1+776], %r6571; | |
st.local.u32 [%rd1+780], %r1146; | |
mov.u32 %r6253, %r6571; | |
mov.u32 %r6571, %r1146; | |
mov.u32 %r6570, %r6253; | |
BB0_387: | |
mov.u32 %r1149, %r6570; | |
mov.u32 %r1148, %r6571; | |
setp.le.u32 %p196, %r6564, %r1149; | |
mov.u32 %r6566, %r1149; | |
mov.u32 %r6567, %r1148; | |
@%p196 bra BB0_389; | |
st.local.u32 [%rd1+768], %r1149; | |
st.local.u32 [%rd1+776], %r6564; | |
st.local.u32 [%rd1+772], %r1148; | |
st.local.u32 [%rd1+780], %r6565; | |
mov.u32 %r6250, %r6565; | |
mov.u32 %r6252, %r6564; | |
mov.u32 %r6565, %r1148; | |
mov.u32 %r6564, %r1149; | |
mov.u32 %r6566, %r6252; | |
mov.u32 %r6567, %r6250; | |
BB0_389: | |
mov.u32 %r6556, %r6564; | |
mov.u32 %r6557, %r6565; | |
mov.u32 %r6558, %r6566; | |
mov.u32 %r6559, %r6567; | |
mul.lo.s64 %rd1528, %rd100, 1792; | |
add.s64 %rd1529, %rd3, %rd1528; | |
bfe.u32 %r3053, %r1140, 22, 6; | |
mul.wide.u32 %rd1530, %r3053, 28; | |
add.s64 %rd1531, %rd1529, %rd1530; | |
ld.global.u32 %r1154, [%rd1531+-8]; | |
and.b32 %r3054, %r1154, 65535; | |
cvt.u64.u32 %rd102, %r3054; | |
bfe.u32 %r3055, %r1154, 16, 6; | |
mul.wide.u32 %rd1532, %r3054, 1792; | |
add.s64 %rd1533, %rd136, %rd1532; | |
mul.wide.u32 %rd1534, %r3055, 28; | |
add.s64 %rd1535, %rd1533, %rd1534; | |
ld.global.u32 %r3056, [%rd1535]; | |
and.b32 %r3057, %r3056, 65535; | |
bfe.u32 %r3058, %r3056, 16, 6; | |
mul.wide.u32 %rd1536, %r3057, 1792; | |
add.s64 %rd1537, %rd135, %rd1536; | |
mul.wide.u32 %rd1538, %r3058, 28; | |
add.s64 %rd1539, %rd1537, %rd1538; | |
ld.global.u32 %r3059, [%rd1539]; | |
and.b32 %r3060, %r3059, 65535; | |
shl.b32 %r3061, %r3060, 6; | |
bfe.u32 %r3062, %r3059, 16, 6; | |
or.b32 %r1155, %r3061, %r3062; | |
st.local.u32 [%rd1+784], %r1155; | |
bfe.u32 %r3063, %r3056, 22, 6; | |
mul.wide.u32 %rd1540, %r3063, 28; | |
add.s64 %rd1541, %rd1537, %rd1540; | |
ld.global.u32 %r3064, [%rd1541]; | |
and.b32 %r3065, %r3064, 65535; | |
shl.b32 %r3066, %r3065, 6; | |
bfe.u32 %r3067, %r3064, 16, 6; | |
or.b32 %r6577, %r3066, %r3067; | |
st.local.u32 [%rd1+788], %r6577; | |
setp.le.u32 %p197, %r1155, %r6577; | |
mov.u32 %r6576, %r1155; | |
@%p197 bra BB0_391; | |
st.local.u32 [%rd1+784], %r6577; | |
st.local.u32 [%rd1+788], %r1155; | |
mov.u32 %r6267, %r6577; | |
mov.u32 %r6577, %r1155; | |
mov.u32 %r6576, %r6267; | |
BB0_391: | |
mov.u32 %r6572, %r6576; | |
mov.u32 %r6573, %r6577; | |
bfe.u32 %r3068, %r1154, 22, 6; | |
mul.lo.s64 %rd1542, %rd102, 1792; | |
add.s64 %rd1543, %rd136, %rd1542; | |
mul.wide.u32 %rd1544, %r3068, 28; | |
add.s64 %rd1545, %rd1543, %rd1544; | |
ld.global.u32 %r3069, [%rd1545]; | |
and.b32 %r3070, %r3069, 65535; | |
bfe.u32 %r3071, %r3069, 16, 6; | |
mul.wide.u32 %rd1546, %r3070, 1792; | |
add.s64 %rd1547, %rd135, %rd1546; | |
mul.wide.u32 %rd1548, %r3071, 28; | |
add.s64 %rd1549, %rd1547, %rd1548; | |
ld.global.u32 %r3072, [%rd1549]; | |
and.b32 %r3073, %r3072, 65535; | |
shl.b32 %r3074, %r3073, 6; | |
bfe.u32 %r3075, %r3072, 16, 6; | |
or.b32 %r1159, %r3074, %r3075; | |
st.local.u32 [%rd1+792], %r1159; | |
bfe.u32 %r3076, %r3069, 22, 6; | |
mul.wide.u32 %rd1550, %r3076, 28; | |
add.s64 %rd1551, %rd1547, %rd1550; | |
ld.global.u32 %r3077, [%rd1551]; | |
and.b32 %r3078, %r3077, 65535; | |
shl.b32 %r3079, %r3078, 6; | |
bfe.u32 %r3080, %r3077, 16, 6; | |
or.b32 %r6579, %r3079, %r3080; | |
st.local.u32 [%rd1+796], %r6579; | |
setp.le.u32 %p198, %r1159, %r6579; | |
mov.u32 %r6578, %r1159; | |
@%p198 bra BB0_393; | |
st.local.u32 [%rd1+792], %r6579; | |
st.local.u32 [%rd1+796], %r1159; | |
mov.u32 %r6273, %r6579; | |
mov.u32 %r6579, %r1159; | |
mov.u32 %r6578, %r6273; | |
BB0_393: | |
mov.u32 %r1162, %r6578; | |
mov.u32 %r1161, %r6579; | |
setp.le.u32 %p199, %r6572, %r1162; | |
mov.u32 %r6574, %r1162; | |
mov.u32 %r6575, %r1161; | |
@%p199 bra BB0_395; | |
st.local.u32 [%rd1+784], %r1162; | |
st.local.u32 [%rd1+792], %r6572; | |
st.local.u32 [%rd1+788], %r1161; | |
st.local.u32 [%rd1+796], %r6573; | |
mov.u32 %r6270, %r6573; | |
mov.u32 %r6272, %r6572; | |
mov.u32 %r6573, %r1161; | |
mov.u32 %r6572, %r1162; | |
mov.u32 %r6574, %r6272; | |
mov.u32 %r6575, %r6270; | |
BB0_395: | |
mov.u32 %r1166, %r6572; | |
mov.u32 %r1165, %r6573; | |
mov.u32 %r1164, %r6574; | |
mov.u32 %r1163, %r6575; | |
setp.le.u32 %p200, %r6556, %r1166; | |
mov.u32 %r6560, %r1166; | |
mov.u32 %r6561, %r1165; | |
mov.u32 %r6562, %r1164; | |
mov.u32 %r6563, %r1163; | |
@%p200 bra BB0_397; | |
st.local.u32 [%rd1+768], %r1166; | |
st.local.u32 [%rd1+784], %r6556; | |
st.local.u32 [%rd1+772], %r1165; | |
st.local.u32 [%rd1+788], %r6557; | |
st.local.u32 [%rd1+776], %r1164; | |
st.local.u32 [%rd1+792], %r6558; | |
st.local.u32 [%rd1+780], %r1163; | |
st.local.u32 [%rd1+796], %r6559; | |
mov.u32 %r6260, %r6559; | |
mov.u32 %r6262, %r6558; | |
mov.u32 %r6264, %r6557; | |
mov.u32 %r6266, %r6556; | |
mov.u32 %r6559, %r1163; | |
mov.u32 %r6558, %r1164; | |
mov.u32 %r6557, %r1165; | |
mov.u32 %r6556, %r1166; | |
mov.u32 %r6560, %r6266; | |
mov.u32 %r6561, %r6264; | |
mov.u32 %r6562, %r6262; | |
mov.u32 %r6563, %r6260; | |
BB0_397: | |
mov.u32 %r6540, %r6556; | |
mov.u32 %r6541, %r6557; | |
mov.u32 %r6542, %r6558; | |
mov.u32 %r6543, %r6559; | |
mov.u32 %r6544, %r6560; | |
mov.u32 %r6545, %r6561; | |
mov.u32 %r6546, %r6562; | |
mov.u32 %r6547, %r6563; | |
mul.lo.s64 %rd1552, %rd99, 1792; | |
add.s64 %rd1553, %rd136, %rd1552; | |
bfe.u32 %r3081, %r1139, 22, 6; | |
mul.wide.u32 %rd1554, %r3081, 28; | |
add.s64 %rd1555, %rd1553, %rd1554; | |
ld.global.u32 %r1175, [%rd1555+4]; | |
and.b32 %r3082, %r1175, 65535; | |
mul.wide.u32 %rd1556, %r3082, 1792; | |
add.s64 %rd1557, %rd3, %rd1556; | |
cvt.u64.u32 %rd103, %r3082; | |
bfe.u32 %r3083, %r1175, 16, 6; | |
mul.wide.u32 %rd1558, %r3083, 28; | |
add.s64 %rd1559, %rd1557, %rd1558; | |
ld.global.u32 %r1176, [%rd1559+-8]; | |
and.b32 %r3084, %r1176, 65535; | |
cvt.u64.u32 %rd104, %r3084; | |
bfe.u32 %r3085, %r1176, 16, 6; | |
mul.wide.u32 %rd1560, %r3084, 1792; | |
add.s64 %rd1561, %rd136, %rd1560; | |
mul.wide.u32 %rd1562, %r3085, 28; | |
add.s64 %rd1563, %rd1561, %rd1562; | |
ld.global.u32 %r3086, [%rd1563]; | |
and.b32 %r3087, %r3086, 65535; | |
bfe.u32 %r3088, %r3086, 16, 6; | |
mul.wide.u32 %rd1564, %r3087, 1792; | |
add.s64 %rd1565, %rd135, %rd1564; | |
mul.wide.u32 %rd1566, %r3088, 28; | |
add.s64 %rd1567, %rd1565, %rd1566; | |
ld.global.u32 %r3089, [%rd1567]; | |
and.b32 %r3090, %r3089, 65535; | |
shl.b32 %r3091, %r3090, 6; | |
bfe.u32 %r3092, %r3089, 16, 6; | |
or.b32 %r1177, %r3091, %r3092; | |
st.local.u32 [%rd1+800], %r1177; | |
bfe.u32 %r3093, %r3086, 22, 6; | |
mul.wide.u32 %rd1568, %r3093, 28; | |
add.s64 %rd1569, %rd1565, %rd1568; | |
ld.global.u32 %r3094, [%rd1569]; | |
and.b32 %r3095, %r3094, 65535; | |
shl.b32 %r3096, %r3095, 6; | |
bfe.u32 %r3097, %r3094, 16, 6; | |
or.b32 %r6593, %r3096, %r3097; | |
st.local.u32 [%rd1+804], %r6593; | |
setp.le.u32 %p201, %r1177, %r6593; | |
mov.u32 %r6592, %r1177; | |
@%p201 bra BB0_399; | |
st.local.u32 [%rd1+800], %r6593; | |
st.local.u32 [%rd1+804], %r1177; | |
mov.u32 %r6303, %r6593; | |
mov.u32 %r6593, %r1177; | |
mov.u32 %r6592, %r6303; | |
BB0_399: | |
mov.u32 %r6588, %r6592; | |
mov.u32 %r6589, %r6593; | |
bfe.u32 %r3098, %r1176, 22, 6; | |
mul.lo.s64 %rd1570, %rd104, 1792; | |
add.s64 %rd1571, %rd136, %rd1570; | |
mul.wide.u32 %rd1572, %r3098, 28; | |
add.s64 %rd1573, %rd1571, %rd1572; | |
ld.global.u32 %r3099, [%rd1573]; | |
and.b32 %r3100, %r3099, 65535; | |
bfe.u32 %r3101, %r3099, 16, 6; | |
mul.wide.u32 %rd1574, %r3100, 1792; | |
add.s64 %rd1575, %rd135, %rd1574; | |
mul.wide.u32 %rd1576, %r3101, 28; | |
add.s64 %rd1577, %rd1575, %rd1576; | |
ld.global.u32 %r3102, [%rd1577]; | |
and.b32 %r3103, %r3102, 65535; | |
shl.b32 %r3104, %r3103, 6; | |
bfe.u32 %r3105, %r3102, 16, 6; | |
or.b32 %r1181, %r3104, %r3105; | |
st.local.u32 [%rd1+808], %r1181; | |
bfe.u32 %r3106, %r3099, 22, 6; | |
mul.wide.u32 %rd1578, %r3106, 28; | |
add.s64 %rd1579, %rd1575, %rd1578; | |
ld.global.u32 %r3107, [%rd1579]; | |
and.b32 %r3108, %r3107, 65535; | |
shl.b32 %r3109, %r3108, 6; | |
bfe.u32 %r3110, %r3107, 16, 6; | |
or.b32 %r6595, %r3109, %r3110; | |
st.local.u32 [%rd1+812], %r6595; | |
setp.le.u32 %p202, %r1181, %r6595; | |
mov.u32 %r6594, %r1181; | |
@%p202 bra BB0_401; | |
st.local.u32 [%rd1+808], %r6595; | |
st.local.u32 [%rd1+812], %r1181; | |
mov.u32 %r6309, %r6595; | |
mov.u32 %r6595, %r1181; | |
mov.u32 %r6594, %r6309; | |
BB0_401: | |
mov.u32 %r1184, %r6594; | |
mov.u32 %r1183, %r6595; | |
setp.le.u32 %p203, %r6588, %r1184; | |
mov.u32 %r6590, %r1184; | |
mov.u32 %r6591, %r1183; | |
@%p203 bra BB0_403; | |
st.local.u32 [%rd1+800], %r1184; | |
st.local.u32 [%rd1+808], %r6588; | |
st.local.u32 [%rd1+804], %r1183; | |
st.local.u32 [%rd1+812], %r6589; | |
mov.u32 %r6306, %r6589; | |
mov.u32 %r6308, %r6588; | |
mov.u32 %r6589, %r1183; | |
mov.u32 %r6588, %r1184; | |
mov.u32 %r6590, %r6308; | |
mov.u32 %r6591, %r6306; | |
BB0_403: | |
mov.u32 %r6580, %r6588; | |
mov.u32 %r6581, %r6589; | |
mov.u32 %r6582, %r6590; | |
mov.u32 %r6583, %r6591; | |
mul.lo.s64 %rd1580, %rd103, 1792; | |
add.s64 %rd1581, %rd3, %rd1580; | |
bfe.u32 %r3111, %r1175, 22, 6; | |
mul.wide.u32 %rd1582, %r3111, 28; | |
add.s64 %rd1583, %rd1581, %rd1582; | |
ld.global.u32 %r1189, [%rd1583+-8]; | |
and.b32 %r3112, %r1189, 65535; | |
cvt.u64.u32 %rd105, %r3112; | |
bfe.u32 %r3113, %r1189, 16, 6; | |
mul.wide.u32 %rd1584, %r3112, 1792; | |
add.s64 %rd1585, %rd136, %rd1584; | |
mul.wide.u32 %rd1586, %r3113, 28; | |
add.s64 %rd1587, %rd1585, %rd1586; | |
ld.global.u32 %r3114, [%rd1587]; | |
and.b32 %r3115, %r3114, 65535; | |
bfe.u32 %r3116, %r3114, 16, 6; | |
mul.wide.u32 %rd1588, %r3115, 1792; | |
add.s64 %rd1589, %rd135, %rd1588; | |
mul.wide.u32 %rd1590, %r3116, 28; | |
add.s64 %rd1591, %rd1589, %rd1590; | |
ld.global.u32 %r3117, [%rd1591]; | |
and.b32 %r3118, %r3117, 65535; | |
shl.b32 %r3119, %r3118, 6; | |
bfe.u32 %r3120, %r3117, 16, 6; | |
or.b32 %r1190, %r3119, %r3120; | |
st.local.u32 [%rd1+816], %r1190; | |
bfe.u32 %r3121, %r3114, 22, 6; | |
mul.wide.u32 %rd1592, %r3121, 28; | |
add.s64 %rd1593, %rd1589, %rd1592; | |
ld.global.u32 %r3122, [%rd1593]; | |
and.b32 %r3123, %r3122, 65535; | |
shl.b32 %r3124, %r3123, 6; | |
bfe.u32 %r3125, %r3122, 16, 6; | |
or.b32 %r6601, %r3124, %r3125; | |
st.local.u32 [%rd1+820], %r6601; | |
setp.le.u32 %p204, %r1190, %r6601; | |
mov.u32 %r6600, %r1190; | |
@%p204 bra BB0_405; | |
st.local.u32 [%rd1+816], %r6601; | |
st.local.u32 [%rd1+820], %r1190; | |
mov.u32 %r6323, %r6601; | |
mov.u32 %r6601, %r1190; | |
mov.u32 %r6600, %r6323; | |
BB0_405: | |
mov.u32 %r6596, %r6600; | |
mov.u32 %r6597, %r6601; | |
bfe.u32 %r3126, %r1189, 22, 6; | |
mul.lo.s64 %rd1594, %rd105, 1792; | |
add.s64 %rd1595, %rd136, %rd1594; | |
mul.wide.u32 %rd1596, %r3126, 28; | |
add.s64 %rd1597, %rd1595, %rd1596; | |
ld.global.u32 %r3127, [%rd1597]; | |
and.b32 %r3128, %r3127, 65535; | |
bfe.u32 %r3129, %r3127, 16, 6; | |
mul.wide.u32 %rd1598, %r3128, 1792; | |
add.s64 %rd1599, %rd135, %rd1598; | |
mul.wide.u32 %rd1600, %r3129, 28; | |
add.s64 %rd1601, %rd1599, %rd1600; | |
ld.global.u32 %r3130, [%rd1601]; | |
and.b32 %r3131, %r3130, 65535; | |
shl.b32 %r3132, %r3131, 6; | |
bfe.u32 %r3133, %r3130, 16, 6; | |
or.b32 %r1194, %r3132, %r3133; | |
st.local.u32 [%rd1+824], %r1194; | |
bfe.u32 %r3134, %r3127, 22, 6; | |
mul.wide.u32 %rd1602, %r3134, 28; | |
add.s64 %rd1603, %rd1599, %rd1602; | |
ld.global.u32 %r3135, [%rd1603]; | |
and.b32 %r3136, %r3135, 65535; | |
shl.b32 %r3137, %r3136, 6; | |
bfe.u32 %r3138, %r3135, 16, 6; | |
or.b32 %r6603, %r3137, %r3138; | |
st.local.u32 [%rd1+828], %r6603; | |
setp.le.u32 %p205, %r1194, %r6603; | |
mov.u32 %r6602, %r1194; | |
@%p205 bra BB0_407; | |
st.local.u32 [%rd1+824], %r6603; | |
st.local.u32 [%rd1+828], %r1194; | |
mov.u32 %r6329, %r6603; | |
mov.u32 %r6603, %r1194; | |
mov.u32 %r6602, %r6329; | |
BB0_407: | |
mov.u32 %r1197, %r6602; | |
mov.u32 %r1196, %r6603; | |
setp.le.u32 %p206, %r6596, %r1197; | |
mov.u32 %r6598, %r1197; | |
mov.u32 %r6599, %r1196; | |
@%p206 bra BB0_409; | |
st.local.u32 [%rd1+816], %r1197; | |
st.local.u32 [%rd1+824], %r6596; | |
st.local.u32 [%rd1+820], %r1196; | |
st.local.u32 [%rd1+828], %r6597; | |
mov.u32 %r6326, %r6597; | |
mov.u32 %r6328, %r6596; | |
mov.u32 %r6597, %r1196; | |
mov.u32 %r6596, %r1197; | |
mov.u32 %r6598, %r6328; | |
mov.u32 %r6599, %r6326; | |
BB0_409: | |
mov.u32 %r1201, %r6596; | |
mov.u32 %r1200, %r6597; | |
mov.u32 %r1199, %r6598; | |
mov.u32 %r1198, %r6599; | |
setp.le.u32 %p207, %r6580, %r1201; | |
mov.u32 %r6584, %r1201; | |
mov.u32 %r6585, %r1200; | |
mov.u32 %r6586, %r1199; | |
mov.u32 %r6587, %r1198; | |
@%p207 bra BB0_411; | |
st.local.u32 [%rd1+800], %r1201; | |
st.local.u32 [%rd1+816], %r6580; | |
st.local.u32 [%rd1+804], %r1200; | |
st.local.u32 [%rd1+820], %r6581; | |
st.local.u32 [%rd1+808], %r1199; | |
st.local.u32 [%rd1+824], %r6582; | |
st.local.u32 [%rd1+812], %r1198; | |
st.local.u32 [%rd1+828], %r6583; | |
mov.u32 %r6316, %r6583; | |
mov.u32 %r6318, %r6582; | |
mov.u32 %r6320, %r6581; | |
mov.u32 %r6322, %r6580; | |
mov.u32 %r6583, %r1198; | |
mov.u32 %r6582, %r1199; | |
mov.u32 %r6581, %r1200; | |
mov.u32 %r6580, %r1201; | |
mov.u32 %r6584, %r6322; | |
mov.u32 %r6585, %r6320; | |
mov.u32 %r6586, %r6318; | |
mov.u32 %r6587, %r6316; | |
BB0_411: | |
mov.u32 %r1209, %r6580; | |
mov.u32 %r1208, %r6581; | |
mov.u32 %r1207, %r6582; | |
mov.u32 %r1206, %r6583; | |
mov.u32 %r1205, %r6584; | |
mov.u32 %r1204, %r6585; | |
mov.u32 %r1203, %r6586; | |
mov.u32 %r1202, %r6587; | |
setp.le.u32 %p208, %r6540, %r1209; | |
mov.u32 %r6548, %r1209; | |
mov.u32 %r6549, %r1208; | |
mov.u32 %r6550, %r1207; | |
mov.u32 %r6551, %r1206; | |
mov.u32 %r6552, %r1205; | |
mov.u32 %r6553, %r1204; | |
mov.u32 %r6554, %r1203; | |
mov.u32 %r6555, %r1202; | |
@%p208 bra BB0_413; | |
st.local.u32 [%rd1+768], %r1209; | |
st.local.u32 [%rd1+800], %r6540; | |
st.local.u32 [%rd1+772], %r1208; | |
st.local.u32 [%rd1+804], %r6541; | |
st.local.u32 [%rd1+776], %r1207; | |
st.local.u32 [%rd1+808], %r6542; | |
st.local.u32 [%rd1+780], %r1206; | |
st.local.u32 [%rd1+812], %r6543; | |
st.local.u32 [%rd1+784], %r1205; | |
st.local.u32 [%rd1+816], %r6544; | |
st.local.u32 [%rd1+788], %r1204; | |
st.local.u32 [%rd1+820], %r6545; | |
st.local.u32 [%rd1+792], %r1203; | |
st.local.u32 [%rd1+824], %r6546; | |
st.local.u32 [%rd1+796], %r1202; | |
st.local.u32 [%rd1+828], %r6547; | |
mov.u32 %r6288, %r6547; | |
mov.u32 %r6290, %r6546; | |
mov.u32 %r6292, %r6545; | |
mov.u32 %r6294, %r6544; | |
mov.u32 %r6296, %r6543; | |
mov.u32 %r6298, %r6542; | |
mov.u32 %r6300, %r6541; | |
mov.u32 %r6302, %r6540; | |
mov.u32 %r6547, %r1202; | |
mov.u32 %r6546, %r1203; | |
mov.u32 %r6545, %r1204; | |
mov.u32 %r6544, %r1205; | |
mov.u32 %r6543, %r1206; | |
mov.u32 %r6542, %r1207; | |
mov.u32 %r6541, %r1208; | |
mov.u32 %r6540, %r1209; | |
mov.u32 %r6548, %r6302; | |
mov.u32 %r6549, %r6300; | |
mov.u32 %r6550, %r6298; | |
mov.u32 %r6551, %r6296; | |
mov.u32 %r6552, %r6294; | |
mov.u32 %r6553, %r6292; | |
mov.u32 %r6554, %r6290; | |
mov.u32 %r6555, %r6288; | |
BB0_413: | |
mov.u32 %r1225, %r6540; | |
mul.lo.s64 %rd1604, %rd98, 1792; | |
add.s64 %rd1605, %rd3, %rd1604; | |
bfe.u32 %r3139, %r1138, 22, 6; | |
mul.wide.u32 %rd1606, %r3139, 28; | |
add.s64 %rd1607, %rd1605, %rd1606; | |
ld.global.u32 %r1226, [%rd1607+-4]; | |
and.b32 %r3140, %r1226, 65535; | |
mul.wide.u32 %rd1608, %r3140, 1792; | |
add.s64 %rd1609, %rd136, %rd1608; | |
bfe.u32 %r3141, %r1226, 16, 6; | |
mul.wide.u32 %rd1610, %r3141, 28; | |
add.s64 %rd1611, %rd1609, %rd1610; | |
ld.global.u32 %r1227, [%rd1611+4]; | |
and.b32 %r3142, %r1227, 65535; | |
mul.wide.u32 %rd1612, %r3142, 1792; | |
add.s64 %rd1613, %rd3, %rd1612; | |
cvt.u64.u32 %rd106, %r3140; | |
cvt.u64.u32 %rd107, %r3142; | |
bfe.u32 %r3143, %r1227, 16, 6; | |
mul.wide.u32 %rd1614, %r3143, 28; | |
add.s64 %rd1615, %rd1613, %rd1614; | |
ld.global.u32 %r1228, [%rd1615+-8]; | |
and.b32 %r3144, %r1228, 65535; | |
cvt.u64.u32 %rd108, %r3144; | |
bfe.u32 %r3145, %r1228, 16, 6; | |
mul.wide.u32 %rd1616, %r3144, 1792; | |
add.s64 %rd1617, %rd136, %rd1616; | |
mul.wide.u32 %rd1618, %r3145, 28; | |
add.s64 %rd1619, %rd1617, %rd1618; | |
ld.global.u32 %r3146, [%rd1619]; | |
and.b32 %r3147, %r3146, 65535; | |
bfe.u32 %r3148, %r3146, 16, 6; | |
mul.wide.u32 %rd1620, %r3147, 1792; | |
add.s64 %rd1621, %rd135, %rd1620; | |
mul.wide.u32 %rd1622, %r3148, 28; | |
add.s64 %rd1623, %rd1621, %rd1622; | |
ld.global.u32 %r3149, [%rd1623]; | |
and.b32 %r3150, %r3149, 65535; | |
shl.b32 %r3151, %r3150, 6; | |
bfe.u32 %r3152, %r3149, 16, 6; | |
or.b32 %r1229, %r3151, %r3152; | |
st.local.u32 [%rd1+832], %r1229; | |
bfe.u32 %r3153, %r3146, 22, 6; | |
mul.wide.u32 %rd1624, %r3153, 28; | |
add.s64 %rd1625, %rd1621, %rd1624; | |
ld.global.u32 %r3154, [%rd1625]; | |
and.b32 %r3155, %r3154, 65535; | |
shl.b32 %r3156, %r3155, 6; | |
bfe.u32 %r3157, %r3154, 16, 6; | |
or.b32 %r6505, %r3156, %r3157; | |
st.local.u32 [%rd1+836], %r6505; | |
setp.le.u32 %p209, %r1229, %r6505; | |
mov.u32 %r6504, %r1229; | |
@%p209 bra BB0_415; | |
st.local.u32 [%rd1+832], %r6505; | |
st.local.u32 [%rd1+836], %r1229; | |
mov.u32 %r6360, %r6505; | |
mov.u32 %r6505, %r1229; | |
mov.u32 %r6504, %r6360; | |
BB0_415: | |
mov.u32 %r6500, %r6504; | |
mov.u32 %r6501, %r6505; | |
bfe.u32 %r3158, %r1228, 22, 6; | |
mul.lo.s64 %rd1626, %rd108, 1792; | |
add.s64 %rd1627, %rd136, %rd1626; | |
mul.wide.u32 %rd1628, %r3158, 28; | |
add.s64 %rd1629, %rd1627, %rd1628; | |
ld.global.u32 %r3159, [%rd1629]; | |
and.b32 %r3160, %r3159, 65535; | |
bfe.u32 %r3161, %r3159, 16, 6; | |
mul.wide.u32 %rd1630, %r3160, 1792; | |
add.s64 %rd1631, %rd135, %rd1630; | |
mul.wide.u32 %rd1632, %r3161, 28; | |
add.s64 %rd1633, %rd1631, %rd1632; | |
ld.global.u32 %r3162, [%rd1633]; | |
and.b32 %r3163, %r3162, 65535; | |
shl.b32 %r3164, %r3163, 6; | |
bfe.u32 %r3165, %r3162, 16, 6; | |
or.b32 %r1233, %r3164, %r3165; | |
st.local.u32 [%rd1+840], %r1233; | |
bfe.u32 %r3166, %r3159, 22, 6; | |
mul.wide.u32 %rd1634, %r3166, 28; | |
add.s64 %rd1635, %rd1631, %rd1634; | |
ld.global.u32 %r3167, [%rd1635]; | |
and.b32 %r3168, %r3167, 65535; | |
shl.b32 %r3169, %r3168, 6; | |
bfe.u32 %r3170, %r3167, 16, 6; | |
or.b32 %r6507, %r3169, %r3170; | |
st.local.u32 [%rd1+844], %r6507; | |
setp.le.u32 %p210, %r1233, %r6507; | |
mov.u32 %r6506, %r1233; | |
@%p210 bra BB0_417; | |
st.local.u32 [%rd1+840], %r6507; | |
st.local.u32 [%rd1+844], %r1233; | |
mov.u32 %r6366, %r6507; | |
mov.u32 %r6507, %r1233; | |
mov.u32 %r6506, %r6366; | |
BB0_417: | |
mov.u32 %r1236, %r6506; | |
mov.u32 %r1235, %r6507; | |
setp.le.u32 %p211, %r6500, %r1236; | |
mov.u32 %r6502, %r1236; | |
mov.u32 %r6503, %r1235; | |
@%p211 bra BB0_419; | |
st.local.u32 [%rd1+832], %r1236; | |
st.local.u32 [%rd1+840], %r6500; | |
st.local.u32 [%rd1+836], %r1235; | |
st.local.u32 [%rd1+844], %r6501; | |
mov.u32 %r6363, %r6501; | |
mov.u32 %r6365, %r6500; | |
mov.u32 %r6501, %r1235; | |
mov.u32 %r6500, %r1236; | |
mov.u32 %r6502, %r6365; | |
mov.u32 %r6503, %r6363; | |
BB0_419: | |
mov.u32 %r6492, %r6500; | |
mov.u32 %r6493, %r6501; | |
mov.u32 %r6494, %r6502; | |
mov.u32 %r6495, %r6503; | |
mul.lo.s64 %rd1636, %rd107, 1792; | |
add.s64 %rd1637, %rd3, %rd1636; | |
bfe.u32 %r3171, %r1227, 22, 6; | |
mul.wide.u32 %rd1638, %r3171, 28; | |
add.s64 %rd1639, %rd1637, %rd1638; | |
ld.global.u32 %r1241, [%rd1639+-8]; | |
and.b32 %r3172, %r1241, 65535; | |
cvt.u64.u32 %rd109, %r3172; | |
bfe.u32 %r3173, %r1241, 16, 6; | |
mul.wide.u32 %rd1640, %r3172, 1792; | |
add.s64 %rd1641, %rd136, %rd1640; | |
mul.wide.u32 %rd1642, %r3173, 28; | |
add.s64 %rd1643, %rd1641, %rd1642; | |
ld.global.u32 %r3174, [%rd1643]; | |
and.b32 %r3175, %r3174, 65535; | |
bfe.u32 %r3176, %r3174, 16, 6; | |
mul.wide.u32 %rd1644, %r3175, 1792; | |
add.s64 %rd1645, %rd135, %rd1644; | |
mul.wide.u32 %rd1646, %r3176, 28; | |
add.s64 %rd1647, %rd1645, %rd1646; | |
ld.global.u32 %r3177, [%rd1647]; | |
and.b32 %r3178, %r3177, 65535; | |
shl.b32 %r3179, %r3178, 6; | |
bfe.u32 %r3180, %r3177, 16, 6; | |
or.b32 %r1242, %r3179, %r3180; | |
st.local.u32 [%rd1+848], %r1242; | |
bfe.u32 %r3181, %r3174, 22, 6; | |
mul.wide.u32 %rd1648, %r3181, 28; | |
add.s64 %rd1649, %rd1645, %rd1648; | |
ld.global.u32 %r3182, [%rd1649]; | |
and.b32 %r3183, %r3182, 65535; | |
shl.b32 %r3184, %r3183, 6; | |
bfe.u32 %r3185, %r3182, 16, 6; | |
or.b32 %r6513, %r3184, %r3185; | |
st.local.u32 [%rd1+852], %r6513; | |
setp.le.u32 %p212, %r1242, %r6513; | |
mov.u32 %r6512, %r1242; | |
@%p212 bra BB0_421; | |
st.local.u32 [%rd1+848], %r6513; | |
st.local.u32 [%rd1+852], %r1242; | |
mov.u32 %r6380, %r6513; | |
mov.u32 %r6513, %r1242; | |
mov.u32 %r6512, %r6380; | |
BB0_421: | |
mov.u32 %r6508, %r6512; | |
mov.u32 %r6509, %r6513; | |
bfe.u32 %r3186, %r1241, 22, 6; | |
mul.lo.s64 %rd1650, %rd109, 1792; | |
add.s64 %rd1651, %rd136, %rd1650; | |
mul.wide.u32 %rd1652, %r3186, 28; | |
add.s64 %rd1653, %rd1651, %rd1652; | |
ld.global.u32 %r3187, [%rd1653]; | |
and.b32 %r3188, %r3187, 65535; | |
bfe.u32 %r3189, %r3187, 16, 6; | |
mul.wide.u32 %rd1654, %r3188, 1792; | |
add.s64 %rd1655, %rd135, %rd1654; | |
mul.wide.u32 %rd1656, %r3189, 28; | |
add.s64 %rd1657, %rd1655, %rd1656; | |
ld.global.u32 %r3190, [%rd1657]; | |
and.b32 %r3191, %r3190, 65535; | |
shl.b32 %r3192, %r3191, 6; | |
bfe.u32 %r3193, %r3190, 16, 6; | |
or.b32 %r1246, %r3192, %r3193; | |
st.local.u32 [%rd1+856], %r1246; | |
bfe.u32 %r3194, %r3187, 22, 6; | |
mul.wide.u32 %rd1658, %r3194, 28; | |
add.s64 %rd1659, %rd1655, %rd1658; | |
ld.global.u32 %r3195, [%rd1659]; | |
and.b32 %r3196, %r3195, 65535; | |
shl.b32 %r3197, %r3196, 6; | |
bfe.u32 %r3198, %r3195, 16, 6; | |
or.b32 %r6515, %r3197, %r3198; | |
st.local.u32 [%rd1+860], %r6515; | |
setp.le.u32 %p213, %r1246, %r6515; | |
mov.u32 %r6514, %r1246; | |
@%p213 bra BB0_423; | |
st.local.u32 [%rd1+856], %r6515; | |
st.local.u32 [%rd1+860], %r1246; | |
mov.u32 %r6386, %r6515; | |
mov.u32 %r6515, %r1246; | |
mov.u32 %r6514, %r6386; | |
BB0_423: | |
mov.u32 %r1249, %r6514; | |
mov.u32 %r1248, %r6515; | |
setp.le.u32 %p214, %r6508, %r1249; | |
mov.u32 %r6510, %r1249; | |
mov.u32 %r6511, %r1248; | |
@%p214 bra BB0_425; | |
st.local.u32 [%rd1+848], %r1249; | |
st.local.u32 [%rd1+856], %r6508; | |
st.local.u32 [%rd1+852], %r1248; | |
st.local.u32 [%rd1+860], %r6509; | |
mov.u32 %r6383, %r6509; | |
mov.u32 %r6385, %r6508; | |
mov.u32 %r6509, %r1248; | |
mov.u32 %r6508, %r1249; | |
mov.u32 %r6510, %r6385; | |
mov.u32 %r6511, %r6383; | |
BB0_425: | |
mov.u32 %r1253, %r6508; | |
mov.u32 %r1252, %r6509; | |
mov.u32 %r1251, %r6510; | |
mov.u32 %r1250, %r6511; | |
setp.le.u32 %p215, %r6492, %r1253; | |
mov.u32 %r6496, %r1253; | |
mov.u32 %r6497, %r1252; | |
mov.u32 %r6498, %r1251; | |
mov.u32 %r6499, %r1250; | |
@%p215 bra BB0_427; | |
st.local.u32 [%rd1+832], %r1253; | |
st.local.u32 [%rd1+848], %r6492; | |
st.local.u32 [%rd1+836], %r1252; | |
st.local.u32 [%rd1+852], %r6493; | |
st.local.u32 [%rd1+840], %r1251; | |
st.local.u32 [%rd1+856], %r6494; | |
st.local.u32 [%rd1+844], %r1250; | |
st.local.u32 [%rd1+860], %r6495; | |
mov.u32 %r6373, %r6495; | |
mov.u32 %r6375, %r6494; | |
mov.u32 %r6377, %r6493; | |
mov.u32 %r6379, %r6492; | |
mov.u32 %r6495, %r1250; | |
mov.u32 %r6494, %r1251; | |
mov.u32 %r6493, %r1252; | |
mov.u32 %r6492, %r1253; | |
mov.u32 %r6496, %r6379; | |
mov.u32 %r6497, %r6377; | |
mov.u32 %r6498, %r6375; | |
mov.u32 %r6499, %r6373; | |
BB0_427: | |
mov.u32 %r6476, %r6492; | |
mov.u32 %r6477, %r6493; | |
mov.u32 %r6478, %r6494; | |
mov.u32 %r6479, %r6495; | |
mov.u32 %r6480, %r6496; | |
mov.u32 %r6481, %r6497; | |
mov.u32 %r6482, %r6498; | |
mov.u32 %r6483, %r6499; | |
mul.lo.s64 %rd1660, %rd106, 1792; | |
add.s64 %rd1661, %rd136, %rd1660; | |
bfe.u32 %r3199, %r1226, 22, 6; | |
mul.wide.u32 %rd1662, %r3199, 28; | |
add.s64 %rd1663, %rd1661, %rd1662; | |
ld.global.u32 %r1262, [%rd1663+4]; | |
and.b32 %r3200, %r1262, 65535; | |
mul.wide.u32 %rd1664, %r3200, 1792; | |
add.s64 %rd1665, %rd3, %rd1664; | |
cvt.u64.u32 %rd110, %r3200; | |
bfe.u32 %r3201, %r1262, 16, 6; | |
mul.wide.u32 %rd1666, %r3201, 28; | |
add.s64 %rd1667, %rd1665, %rd1666; | |
ld.global.u32 %r1263, [%rd1667+-8]; | |
and.b32 %r3202, %r1263, 65535; | |
cvt.u64.u32 %rd111, %r3202; | |
bfe.u32 %r3203, %r1263, 16, 6; | |
mul.wide.u32 %rd1668, %r3202, 1792; | |
add.s64 %rd1669, %rd136, %rd1668; | |
mul.wide.u32 %rd1670, %r3203, 28; | |
add.s64 %rd1671, %rd1669, %rd1670; | |
ld.global.u32 %r3204, [%rd1671]; | |
and.b32 %r3205, %r3204, 65535; | |
bfe.u32 %r3206, %r3204, 16, 6; | |
mul.wide.u32 %rd1672, %r3205, 1792; | |
add.s64 %rd1673, %rd135, %rd1672; | |
mul.wide.u32 %rd1674, %r3206, 28; | |
add.s64 %rd1675, %rd1673, %rd1674; | |
ld.global.u32 %r3207, [%rd1675]; | |
and.b32 %r3208, %r3207, 65535; | |
shl.b32 %r3209, %r3208, 6; | |
bfe.u32 %r3210, %r3207, 16, 6; | |
or.b32 %r1264, %r3209, %r3210; | |
st.local.u32 [%rd1+864], %r1264; | |
bfe.u32 %r3211, %r3204, 22, 6; | |
mul.wide.u32 %rd1676, %r3211, 28; | |
add.s64 %rd1677, %rd1673, %rd1676; | |
ld.global.u32 %r3212, [%rd1677]; | |
and.b32 %r3213, %r3212, 65535; | |
shl.b32 %r3214, %r3213, 6; | |
bfe.u32 %r3215, %r3212, 16, 6; | |
or.b32 %r6529, %r3214, %r3215; | |
st.local.u32 [%rd1+868], %r6529; | |
setp.le.u32 %p216, %r1264, %r6529; | |
mov.u32 %r6528, %r1264; | |
@%p216 bra BB0_429; | |
st.local.u32 [%rd1+864], %r6529; | |
st.local.u32 [%rd1+868], %r1264; | |
mov.u32 %r6416, %r6529; | |
mov.u32 %r6529, %r1264; | |
mov.u32 %r6528, %r6416; | |
BB0_429: | |
mov.u32 %r6524, %r6528; | |
mov.u32 %r6525, %r6529; | |
bfe.u32 %r3216, %r1263, 22, 6; | |
mul.lo.s64 %rd1678, %rd111, 1792; | |
add.s64 %rd1679, %rd136, %rd1678; | |
mul.wide.u32 %rd1680, %r3216, 28; | |
add.s64 %rd1681, %rd1679, %rd1680; | |
ld.global.u32 %r3217, [%rd1681]; | |
and.b32 %r3218, %r3217, 65535; | |
bfe.u32 %r3219, %r3217, 16, 6; | |
mul.wide.u32 %rd1682, %r3218, 1792; | |
add.s64 %rd1683, %rd135, %rd1682; | |
mul.wide.u32 %rd1684, %r3219, 28; | |
add.s64 %rd1685, %rd1683, %rd1684; | |
ld.global.u32 %r3220, [%rd1685]; | |
and.b32 %r3221, %r3220, 65535; | |
shl.b32 %r3222, %r3221, 6; | |
bfe.u32 %r3223, %r3220, 16, 6; | |
or.b32 %r1268, %r3222, %r3223; | |
st.local.u32 [%rd1+872], %r1268; | |
bfe.u32 %r3224, %r3217, 22, 6; | |
mul.wide.u32 %rd1686, %r3224, 28; | |
add.s64 %rd1687, %rd1683, %rd1686; | |
ld.global.u32 %r3225, [%rd1687]; | |
and.b32 %r3226, %r3225, 65535; | |
shl.b32 %r3227, %r3226, 6; | |
bfe.u32 %r3228, %r3225, 16, 6; | |
or.b32 %r6531, %r3227, %r3228; | |
st.local.u32 [%rd1+876], %r6531; | |
setp.le.u32 %p217, %r1268, %r6531; | |
mov.u32 %r6530, %r1268; | |
@%p217 bra BB0_431; | |
st.local.u32 [%rd1+872], %r6531; | |
st.local.u32 [%rd1+876], %r1268; | |
mov.u32 %r6422, %r6531; | |
mov.u32 %r6531, %r1268; | |
mov.u32 %r6530, %r6422; | |
BB0_431: | |
mov.u32 %r1271, %r6530; | |
mov.u32 %r1270, %r6531; | |
setp.le.u32 %p218, %r6524, %r1271; | |
mov.u32 %r6526, %r1271; | |
mov.u32 %r6527, %r1270; | |
@%p218 bra BB0_433; | |
st.local.u32 [%rd1+864], %r1271; | |
st.local.u32 [%rd1+872], %r6524; | |
st.local.u32 [%rd1+868], %r1270; | |
st.local.u32 [%rd1+876], %r6525; | |
mov.u32 %r6419, %r6525; | |
mov.u32 %r6421, %r6524; | |
mov.u32 %r6525, %r1270; | |
mov.u32 %r6524, %r1271; | |
mov.u32 %r6526, %r6421; | |
mov.u32 %r6527, %r6419; | |
BB0_433: | |
mov.u32 %r6516, %r6524; | |
mov.u32 %r6517, %r6525; | |
mov.u32 %r6518, %r6526; | |
mov.u32 %r6519, %r6527; | |
mul.lo.s64 %rd1688, %rd110, 1792; | |
add.s64 %rd1689, %rd3, %rd1688; | |
bfe.u32 %r3229, %r1262, 22, 6; | |
mul.wide.u32 %rd1690, %r3229, 28; | |
add.s64 %rd1691, %rd1689, %rd1690; | |
ld.global.u32 %r1276, [%rd1691+-8]; | |
and.b32 %r3230, %r1276, 65535; | |
cvt.u64.u32 %rd112, %r3230; | |
bfe.u32 %r3231, %r1276, 16, 6; | |
mul.wide.u32 %rd1692, %r3230, 1792; | |
add.s64 %rd1693, %rd136, %rd1692; | |
mul.wide.u32 %rd1694, %r3231, 28; | |
add.s64 %rd1695, %rd1693, %rd1694; | |
ld.global.u32 %r3232, [%rd1695]; | |
and.b32 %r3233, %r3232, 65535; | |
bfe.u32 %r3234, %r3232, 16, 6; | |
mul.wide.u32 %rd1696, %r3233, 1792; | |
add.s64 %rd1697, %rd135, %rd1696; | |
mul.wide.u32 %rd1698, %r3234, 28; | |
add.s64 %rd1699, %rd1697, %rd1698; | |
ld.global.u32 %r3235, [%rd1699]; | |
and.b32 %r3236, %r3235, 65535; | |
shl.b32 %r3237, %r3236, 6; | |
bfe.u32 %r3238, %r3235, 16, 6; | |
or.b32 %r1277, %r3237, %r3238; | |
st.local.u32 [%rd1+880], %r1277; | |
bfe.u32 %r3239, %r3232, 22, 6; | |
mul.wide.u32 %rd1700, %r3239, 28; | |
add.s64 %rd1701, %rd1697, %rd1700; | |
ld.global.u32 %r3240, [%rd1701]; | |
and.b32 %r3241, %r3240, 65535; | |
shl.b32 %r3242, %r3241, 6; | |
bfe.u32 %r3243, %r3240, 16, 6; | |
or.b32 %r6537, %r3242, %r3243; | |
st.local.u32 [%rd1+884], %r6537; | |
setp.le.u32 %p219, %r1277, %r6537; | |
mov.u32 %r6536, %r1277; | |
@%p219 bra BB0_435; | |
st.local.u32 [%rd1+880], %r6537; | |
st.local.u32 [%rd1+884], %r1277; | |
mov.u32 %r6436, %r6537; | |
mov.u32 %r6537, %r1277; | |
mov.u32 %r6536, %r6436; | |
BB0_435: | |
mov.u32 %r6532, %r6536; | |
mov.u32 %r6533, %r6537; | |
bfe.u32 %r3244, %r1276, 22, 6; | |
mul.lo.s64 %rd1702, %rd112, 1792; | |
add.s64 %rd1703, %rd136, %rd1702; | |
mul.wide.u32 %rd1704, %r3244, 28; | |
add.s64 %rd1705, %rd1703, %rd1704; | |
ld.global.u32 %r3245, [%rd1705]; | |
and.b32 %r3246, %r3245, 65535; | |
bfe.u32 %r3247, %r3245, 16, 6; | |
mul.wide.u32 %rd1706, %r3246, 1792; | |
add.s64 %rd1707, %rd135, %rd1706; | |
mul.wide.u32 %rd1708, %r3247, 28; | |
add.s64 %rd1709, %rd1707, %rd1708; | |
ld.global.u32 %r3248, [%rd1709]; | |
and.b32 %r3249, %r3248, 65535; | |
shl.b32 %r3250, %r3249, 6; | |
bfe.u32 %r3251, %r3248, 16, 6; | |
or.b32 %r1281, %r3250, %r3251; | |
st.local.u32 [%rd1+888], %r1281; | |
bfe.u32 %r3252, %r3245, 22, 6; | |
mul.wide.u32 %rd1710, %r3252, 28; | |
add.s64 %rd1711, %rd1707, %rd1710; | |
ld.global.u32 %r3253, [%rd1711]; | |
and.b32 %r3254, %r3253, 65535; | |
shl.b32 %r3255, %r3254, 6; | |
bfe.u32 %r3256, %r3253, 16, 6; | |
or.b32 %r6539, %r3255, %r3256; | |
st.local.u32 [%rd1+892], %r6539; | |
setp.le.u32 %p220, %r1281, %r6539; | |
mov.u32 %r6538, %r1281; | |
@%p220 bra BB0_437; | |
st.local.u32 [%rd1+888], %r6539; | |
st.local.u32 [%rd1+892], %r1281; | |
mov.u32 %r6442, %r6539; | |
mov.u32 %r6539, %r1281; | |
mov.u32 %r6538, %r6442; | |
BB0_437: | |
mov.u32 %r1284, %r6538; | |
mov.u32 %r1283, %r6539; | |
setp.le.u32 %p221, %r6532, %r1284; | |
mov.u32 %r6534, %r1284; | |
mov.u32 %r6535, %r1283; | |
@%p221 bra BB0_439; | |
st.local.u32 [%rd1+880], %r1284; | |
st.local.u32 [%rd1+888], %r6532; | |
st.local.u32 [%rd1+884], %r1283; | |
st.local.u32 [%rd1+892], %r6533; | |
mov.u32 %r6439, %r6533; | |
mov.u32 %r6441, %r6532; | |
mov.u32 %r6533, %r1283; | |
mov.u32 %r6532, %r1284; | |
mov.u32 %r6534, %r6441; | |
mov.u32 %r6535, %r6439; | |
BB0_439: | |
mov.u32 %r1288, %r6532; | |
mov.u32 %r1287, %r6533; | |
mov.u32 %r1286, %r6534; | |
mov.u32 %r1285, %r6535; | |
setp.le.u32 %p222, %r6516, %r1288; | |
mov.u32 %r6520, %r1288; | |
mov.u32 %r6521, %r1287; | |
mov.u32 %r6522, %r1286; | |
mov.u32 %r6523, %r1285; | |
@%p222 bra BB0_441; | |
st.local.u32 [%rd1+864], %r1288; | |
st.local.u32 [%rd1+880], %r6516; | |
st.local.u32 [%rd1+868], %r1287; | |
st.local.u32 [%rd1+884], %r6517; | |
st.local.u32 [%rd1+872], %r1286; | |
st.local.u32 [%rd1+888], %r6518; | |
st.local.u32 [%rd1+876], %r1285; | |
st.local.u32 [%rd1+892], %r6519; | |
mov.u32 %r6429, %r6519; | |
mov.u32 %r6431, %r6518; | |
mov.u32 %r6433, %r6517; | |
mov.u32 %r6435, %r6516; | |
mov.u32 %r6519, %r1285; | |
mov.u32 %r6518, %r1286; | |
mov.u32 %r6517, %r1287; | |
mov.u32 %r6516, %r1288; | |
mov.u32 %r6520, %r6435; | |
mov.u32 %r6521, %r6433; | |
mov.u32 %r6522, %r6431; | |
mov.u32 %r6523, %r6429; | |
BB0_441: | |
mov.u32 %r1296, %r6516; | |
mov.u32 %r1295, %r6517; | |
mov.u32 %r1294, %r6518; | |
mov.u32 %r1293, %r6519; | |
mov.u32 %r1292, %r6520; | |
mov.u32 %r1291, %r6521; | |
mov.u32 %r1290, %r6522; | |
mov.u32 %r1289, %r6523; | |
setp.le.u32 %p223, %r6476, %r1296; | |
mov.u32 %r6484, %r1296; | |
mov.u32 %r6485, %r1295; | |
mov.u32 %r6486, %r1294; | |
mov.u32 %r6487, %r1293; | |
mov.u32 %r6488, %r1292; | |
mov.u32 %r6489, %r1291; | |
mov.u32 %r6490, %r1290; | |
mov.u32 %r6491, %r1289; | |
@%p223 bra BB0_443; | |
st.local.u32 [%rd1+832], %r1296; | |
st.local.u32 [%rd1+864], %r6476; | |
st.local.u32 [%rd1+836], %r1295; | |
st.local.u32 [%rd1+868], %r6477; | |
st.local.u32 [%rd1+840], %r1294; | |
st.local.u32 [%rd1+872], %r6478; | |
st.local.u32 [%rd1+844], %r1293; | |
st.local.u32 [%rd1+876], %r6479; | |
st.local.u32 [%rd1+848], %r1292; | |
st.local.u32 [%rd1+880], %r6480; | |
st.local.u32 [%rd1+852], %r1291; | |
st.local.u32 [%rd1+884], %r6481; | |
st.local.u32 [%rd1+856], %r1290; | |
st.local.u32 [%rd1+888], %r6482; | |
st.local.u32 [%rd1+860], %r1289; | |
st.local.u32 [%rd1+892], %r6483; | |
mov.u32 %r6401, %r6483; | |
mov.u32 %r6403, %r6482; | |
mov.u32 %r6405, %r6481; | |
mov.u32 %r6407, %r6480; | |
mov.u32 %r6409, %r6479; | |
mov.u32 %r6411, %r6478; | |
mov.u32 %r6413, %r6477; | |
mov.u32 %r6415, %r6476; | |
mov.u32 %r6483, %r1289; | |
mov.u32 %r6482, %r1290; | |
mov.u32 %r6481, %r1291; | |
mov.u32 %r6480, %r1292; | |
mov.u32 %r6479, %r1293; | |
mov.u32 %r6478, %r1294; | |
mov.u32 %r6477, %r1295; | |
mov.u32 %r6476, %r1296; | |
mov.u32 %r6484, %r6415; | |
mov.u32 %r6485, %r6413; | |
mov.u32 %r6486, %r6411; | |
mov.u32 %r6487, %r6409; | |
mov.u32 %r6488, %r6407; | |
mov.u32 %r6489, %r6405; | |
mov.u32 %r6490, %r6403; | |
mov.u32 %r6491, %r6401; | |
BB0_443: | |
mov.u32 %r1312, %r6476; | |
setp.le.u32 %p224, %r1225, %r1312; | |
mov.u32 %r6475, %r1225; | |
@%p224 bra BB0_445; | |
st.local.u32 [%rd1+768], %r1312; | |
st.local.u32 [%rd1+832], %r1225; | |
st.local.u32 [%rd1+772], %r6477; | |
st.local.u32 [%rd1+836], %r6541; | |
st.local.u32 [%rd1+776], %r6478; | |
st.local.u32 [%rd1+840], %r6542; | |
st.local.u32 [%rd1+780], %r6479; | |
st.local.u32 [%rd1+844], %r6543; | |
st.local.u32 [%rd1+784], %r6480; | |
st.local.u32 [%rd1+848], %r6544; | |
st.local.u32 [%rd1+788], %r6481; | |
st.local.u32 [%rd1+852], %r6545; | |
st.local.u32 [%rd1+792], %r6482; | |
st.local.u32 [%rd1+856], %r6546; | |
st.local.u32 [%rd1+796], %r6483; | |
st.local.u32 [%rd1+860], %r6547; | |
st.local.u32 [%rd1+800], %r6484; | |
st.local.u32 [%rd1+864], %r6548; | |
st.local.u32 [%rd1+804], %r6485; | |
st.local.u32 [%rd1+868], %r6549; | |
st.local.u32 [%rd1+808], %r6486; | |
st.local.u32 [%rd1+872], %r6550; | |
st.local.u32 [%rd1+812], %r6487; | |
st.local.u32 [%rd1+876], %r6551; | |
st.local.u32 [%rd1+816], %r6488; | |
st.local.u32 [%rd1+880], %r6552; | |
st.local.u32 [%rd1+820], %r6489; | |
st.local.u32 [%rd1+884], %r6553; | |
st.local.u32 [%rd1+824], %r6490; | |
st.local.u32 [%rd1+888], %r6554; | |
st.local.u32 [%rd1+828], %r6491; | |
st.local.u32 [%rd1+892], %r6555; | |
mov.u32 %r6475, %r1312; | |
BB0_445: | |
mov.u32 %r6474, %r6475; | |
mul.lo.s64 %rd1713, %rd97, 1792; | |
add.s64 %rd1714, %rd146, %rd1713; | |
bfe.u32 %r3257, %r1137, 22, 6; | |
mul.wide.u32 %rd1715, %r3257, 28; | |
add.s64 %rd1716, %rd1714, %rd1715; | |
ld.global.u32 %r1314, [%rd1716+4]; | |
and.b32 %r3258, %r1314, 65535; | |
mul.wide.u32 %rd1717, %r3258, 1792; | |
add.s64 %rd1718, %rd3, %rd1717; | |
bfe.u32 %r3259, %r1314, 16, 6; | |
mul.wide.u32 %rd1719, %r3259, 28; | |
add.s64 %rd1720, %rd1718, %rd1719; | |
ld.global.u32 %r1315, [%rd1720+-4]; | |
and.b32 %r3260, %r1315, 65535; | |
bfe.u32 %r3261, %r1315, 16, 6; | |
mul.wide.u32 %rd1721, %r3260, 1792; | |
add.s64 %rd1722, %rd146, %rd1721; | |
mul.wide.u32 %rd1723, %r3261, 28; | |
add.s64 %rd1724, %rd1722, %rd1723; | |
ld.global.u32 %r1316, [%rd1724]; | |
and.b32 %r3262, %r1316, 65535; | |
mul.wide.u32 %rd1725, %r3262, 1792; | |
add.s64 %rd1726, %rd3, %rd1725; | |
cvt.u64.u32 %rd113, %r3258; | |
cvt.u64.u32 %rd114, %r3260; | |
cvt.u64.u32 %rd115, %r3262; | |
bfe.u32 %r3263, %r1316, 16, 6; | |
mul.wide.u32 %rd1727, %r3263, 28; | |
add.s64 %rd1728, %rd1726, %rd1727; | |
ld.global.u32 %r1317, [%rd1728+-8]; | |
and.b32 %r3264, %r1317, 65535; | |
cvt.u64.u32 %rd116, %r3264; | |
bfe.u32 %r3265, %r1317, 16, 6; | |
mul.wide.u32 %rd1729, %r3264, 1792; | |
add.s64 %rd1730, %rd136, %rd1729; | |
mul.wide.u32 %rd1731, %r3265, 28; | |
add.s64 %rd1732, %rd1730, %rd1731; | |
ld.global.u32 %r3266, [%rd1732]; | |
and.b32 %r3267, %r3266, 65535; | |
bfe.u32 %r3268, %r3266, 16, 6; | |
mul.wide.u32 %rd1733, %r3267, 1792; | |
add.s64 %rd1734, %rd135, %rd1733; | |
mul.wide.u32 %rd1735, %r3268, 28; | |
add.s64 %rd1736, %rd1734, %rd1735; | |
ld.global.u32 %r3269, [%rd1736]; | |
and.b32 %r3270, %r3269, 65535; | |
shl.b32 %r3271, %r3270, 6; | |
bfe.u32 %r3272, %r3269, 16, 6; | |
or.b32 %r1318, %r3271, %r3272; | |
st.local.u32 [%rd1+896], %r1318; | |
bfe.u32 %r3273, %r3266, 22, 6; | |
mul.wide.u32 %rd1737, %r3273, 28; | |
add.s64 %rd1738, %rd1734, %rd1737; | |
ld.global.u32 %r3274, [%rd1738]; | |
and.b32 %r3275, %r3274, 65535; | |
shl.b32 %r3276, %r3275, 6; | |
bfe.u32 %r3277, %r3274, 16, 6; | |
or.b32 %r6211, %r3276, %r3277; | |
st.local.u32 [%rd1+900], %r6211; | |
setp.le.u32 %p225, %r1318, %r6211; | |
mov.u32 %r6210, %r1318; | |
@%p225 bra BB0_447; | |
st.local.u32 [%rd1+896], %r6211; | |
st.local.u32 [%rd1+900], %r1318; | |
mov.u32 %r5891, %r6211; | |
mov.u32 %r6211, %r1318; | |
mov.u32 %r6210, %r5891; | |
BB0_447: | |
mov.u32 %r6206, %r6210; | |
mov.u32 %r6207, %r6211; | |
bfe.u32 %r3278, %r1317, 22, 6; | |
mul.lo.s64 %rd1739, %rd116, 1792; | |
add.s64 %rd1740, %rd136, %rd1739; | |
mul.wide.u32 %rd1741, %r3278, 28; | |
add.s64 %rd1742, %rd1740, %rd1741; | |
ld.global.u32 %r3279, [%rd1742]; | |
and.b32 %r3280, %r3279, 65535; | |
bfe.u32 %r3281, %r3279, 16, 6; | |
mul.wide.u32 %rd1743, %r3280, 1792; | |
add.s64 %rd1744, %rd135, %rd1743; | |
mul.wide.u32 %rd1745, %r3281, 28; | |
add.s64 %rd1746, %rd1744, %rd1745; | |
ld.global.u32 %r3282, [%rd1746]; | |
and.b32 %r3283, %r3282, 65535; | |
shl.b32 %r3284, %r3283, 6; | |
bfe.u32 %r3285, %r3282, 16, 6; | |
or.b32 %r1322, %r3284, %r3285; | |
st.local.u32 [%rd1+904], %r1322; | |
bfe.u32 %r3286, %r3279, 22, 6; | |
mul.wide.u32 %rd1747, %r3286, 28; | |
add.s64 %rd1748, %rd1744, %rd1747; | |
ld.global.u32 %r3287, [%rd1748]; | |
and.b32 %r3288, %r3287, 65535; | |
shl.b32 %r3289, %r3288, 6; | |
bfe.u32 %r3290, %r3287, 16, 6; | |
or.b32 %r6213, %r3289, %r3290; | |
st.local.u32 [%rd1+908], %r6213; | |
setp.le.u32 %p226, %r1322, %r6213; | |
mov.u32 %r6212, %r1322; | |
@%p226 bra BB0_449; | |
st.local.u32 [%rd1+904], %r6213; | |
st.local.u32 [%rd1+908], %r1322; | |
mov.u32 %r5897, %r6213; | |
mov.u32 %r6213, %r1322; | |
mov.u32 %r6212, %r5897; | |
BB0_449: | |
mov.u32 %r1325, %r6212; | |
mov.u32 %r1324, %r6213; | |
setp.le.u32 %p227, %r6206, %r1325; | |
mov.u32 %r6208, %r1325; | |
mov.u32 %r6209, %r1324; | |
@%p227 bra BB0_451; | |
st.local.u32 [%rd1+896], %r1325; | |
st.local.u32 [%rd1+904], %r6206; | |
st.local.u32 [%rd1+900], %r1324; | |
st.local.u32 [%rd1+908], %r6207; | |
mov.u32 %r5894, %r6207; | |
mov.u32 %r5896, %r6206; | |
mov.u32 %r6207, %r1324; | |
mov.u32 %r6206, %r1325; | |
mov.u32 %r6208, %r5896; | |
mov.u32 %r6209, %r5894; | |
BB0_451: | |
mov.u32 %r6198, %r6206; | |
mov.u32 %r6199, %r6207; | |
mov.u32 %r6200, %r6208; | |
mov.u32 %r6201, %r6209; | |
mul.lo.s64 %rd1749, %rd115, 1792; | |
add.s64 %rd1750, %rd3, %rd1749; | |
bfe.u32 %r3291, %r1316, 22, 6; | |
mul.wide.u32 %rd1751, %r3291, 28; | |
add.s64 %rd1752, %rd1750, %rd1751; | |
ld.global.u32 %r1330, [%rd1752+-8]; | |
and.b32 %r3292, %r1330, 65535; | |
cvt.u64.u32 %rd117, %r3292; | |
bfe.u32 %r3293, %r1330, 16, 6; | |
mul.wide.u32 %rd1753, %r3292, 1792; | |
add.s64 %rd1754, %rd136, %rd1753; | |
mul.wide.u32 %rd1755, %r3293, 28; | |
add.s64 %rd1756, %rd1754, %rd1755; | |
ld.global.u32 %r3294, [%rd1756]; | |
and.b32 %r3295, %r3294, 65535; | |
bfe.u32 %r3296, %r3294, 16, 6; | |
mul.wide.u32 %rd1757, %r3295, 1792; | |
add.s64 %rd1758, %rd135, %rd1757; | |
mul.wide.u32 %rd1759, %r3296, 28; | |
add.s64 %rd1760, %rd1758, %rd1759; | |
ld.global.u32 %r3297, [%rd1760]; | |
and.b32 %r3298, %r3297, 65535; | |
shl.b32 %r3299, %r3298, 6; | |
bfe.u32 %r3300, %r3297, 16, 6; | |
or.b32 %r1331, %r3299, %r3300; | |
st.local.u32 [%rd1+912], %r1331; | |
bfe.u32 %r3301, %r3294, 22, 6; | |
mul.wide.u32 %rd1761, %r3301, 28; | |
add.s64 %rd1762, %rd1758, %rd1761; | |
ld.global.u32 %r3302, [%rd1762]; | |
and.b32 %r3303, %r3302, 65535; | |
shl.b32 %r3304, %r3303, 6; | |
bfe.u32 %r3305, %r3302, 16, 6; | |
or.b32 %r6219, %r3304, %r3305; | |
st.local.u32 [%rd1+916], %r6219; | |
setp.le.u32 %p228, %r1331, %r6219; | |
mov.u32 %r6218, %r1331; | |
@%p228 bra BB0_453; | |
st.local.u32 [%rd1+912], %r6219; | |
st.local.u32 [%rd1+916], %r1331; | |
mov.u32 %r5911, %r6219; | |
mov.u32 %r6219, %r1331; | |
mov.u32 %r6218, %r5911; | |
BB0_453: | |
mov.u32 %r6214, %r6218; | |
mov.u32 %r6215, %r6219; | |
bfe.u32 %r3306, %r1330, 22, 6; | |
mul.lo.s64 %rd1763, %rd117, 1792; | |
add.s64 %rd1764, %rd136, %rd1763; | |
mul.wide.u32 %rd1765, %r3306, 28; | |
add.s64 %rd1766, %rd1764, %rd1765; | |
ld.global.u32 %r3307, [%rd1766]; | |
and.b32 %r3308, %r3307, 65535; | |
bfe.u32 %r3309, %r3307, 16, 6; | |
mul.wide.u32 %rd1767, %r3308, 1792; | |
add.s64 %rd1768, %rd135, %rd1767; | |
mul.wide.u32 %rd1769, %r3309, 28; | |
add.s64 %rd1770, %rd1768, %rd1769; | |
ld.global.u32 %r3310, [%rd1770]; | |
and.b32 %r3311, %r3310, 65535; | |
shl.b32 %r3312, %r3311, 6; | |
bfe.u32 %r3313, %r3310, 16, 6; | |
or.b32 %r1335, %r3312, %r3313; | |
st.local.u32 [%rd1+920], %r1335; | |
bfe.u32 %r3314, %r3307, 22, 6; | |
mul.wide.u32 %rd1771, %r3314, 28; | |
add.s64 %rd1772, %rd1768, %rd1771; | |
ld.global.u32 %r3315, [%rd1772]; | |
and.b32 %r3316, %r3315, 65535; | |
shl.b32 %r3317, %r3316, 6; | |
bfe.u32 %r3318, %r3315, 16, 6; | |
or.b32 %r6221, %r3317, %r3318; | |
st.local.u32 [%rd1+924], %r6221; | |
setp.le.u32 %p229, %r1335, %r6221; | |
mov.u32 %r6220, %r1335; | |
@%p229 bra BB0_455; | |
st.local.u32 [%rd1+920], %r6221; | |
st.local.u32 [%rd1+924], %r1335; | |
mov.u32 %r5917, %r6221; | |
mov.u32 %r6221, %r1335; | |
mov.u32 %r6220, %r5917; | |
BB0_455: | |
mov.u32 %r1338, %r6220; | |
mov.u32 %r1337, %r6221; | |
setp.le.u32 %p230, %r6214, %r1338; | |
mov.u32 %r6216, %r1338; | |
mov.u32 %r6217, %r1337; | |
@%p230 bra BB0_457; | |
st.local.u32 [%rd1+912], %r1338; | |
st.local.u32 [%rd1+920], %r6214; | |
st.local.u32 [%rd1+916], %r1337; | |
st.local.u32 [%rd1+924], %r6215; | |
mov.u32 %r5914, %r6215; | |
mov.u32 %r5916, %r6214; | |
mov.u32 %r6215, %r1337; | |
mov.u32 %r6214, %r1338; | |
mov.u32 %r6216, %r5916; | |
mov.u32 %r6217, %r5914; | |
BB0_457: | |
mov.u32 %r1342, %r6214; | |
mov.u32 %r1341, %r6215; | |
mov.u32 %r1340, %r6216; | |
mov.u32 %r1339, %r6217; | |
setp.le.u32 %p231, %r6198, %r1342; | |
mov.u32 %r6202, %r1342; | |
mov.u32 %r6203, %r1341; | |
mov.u32 %r6204, %r1340; | |
mov.u32 %r6205, %r1339; | |
@%p231 bra BB0_459; | |
st.local.u32 [%rd1+896], %r1342; | |
st.local.u32 [%rd1+912], %r6198; | |
st.local.u32 [%rd1+900], %r1341; | |
st.local.u32 [%rd1+916], %r6199; | |
st.local.u32 [%rd1+904], %r1340; | |
st.local.u32 [%rd1+920], %r6200; | |
st.local.u32 [%rd1+908], %r1339; | |
st.local.u32 [%rd1+924], %r6201; | |
mov.u32 %r5904, %r6201; | |
mov.u32 %r5906, %r6200; | |
mov.u32 %r5908, %r6199; | |
mov.u32 %r5910, %r6198; | |
mov.u32 %r6201, %r1339; | |
mov.u32 %r6200, %r1340; | |
mov.u32 %r6199, %r1341; | |
mov.u32 %r6198, %r1342; | |
mov.u32 %r6202, %r5910; | |
mov.u32 %r6203, %r5908; | |
mov.u32 %r6204, %r5906; | |
mov.u32 %r6205, %r5904; | |
BB0_459: | |
mov.u32 %r6182, %r6198; | |
mov.u32 %r6183, %r6199; | |
mov.u32 %r6184, %r6200; | |
mov.u32 %r6185, %r6201; | |
mov.u32 %r6186, %r6202; | |
mov.u32 %r6187, %r6203; | |
mov.u32 %r6188, %r6204; | |
mov.u32 %r6189, %r6205; | |
mul.lo.s64 %rd1773, %rd114, 1792; | |
add.s64 %rd1774, %rd136, %rd1773; | |
bfe.u32 %r3319, %r1315, 22, 6; | |
mul.wide.u32 %rd1775, %r3319, 28; | |
add.s64 %rd1776, %rd1774, %rd1775; | |
ld.global.u32 %r1351, [%rd1776+4]; | |
and.b32 %r3320, %r1351, 65535; | |
mul.wide.u32 %rd1777, %r3320, 1792; | |
add.s64 %rd1778, %rd3, %rd1777; | |
cvt.u64.u32 %rd118, %r3320; | |
bfe.u32 %r3321, %r1351, 16, 6; | |
mul.wide.u32 %rd1779, %r3321, 28; | |
add.s64 %rd1780, %rd1778, %rd1779; | |
ld.global.u32 %r1352, [%rd1780+-8]; | |
and.b32 %r3322, %r1352, 65535; | |
cvt.u64.u32 %rd119, %r3322; | |
bfe.u32 %r3323, %r1352, 16, 6; | |
mul.wide.u32 %rd1781, %r3322, 1792; | |
add.s64 %rd1782, %rd136, %rd1781; | |
mul.wide.u32 %rd1783, %r3323, 28; | |
add.s64 %rd1784, %rd1782, %rd1783; | |
ld.global.u32 %r3324, [%rd1784]; | |
and.b32 %r3325, %r3324, 65535; | |
bfe.u32 %r3326, %r3324, 16, 6; | |
mul.wide.u32 %rd1785, %r3325, 1792; | |
add.s64 %rd1786, %rd135, %rd1785; | |
mul.wide.u32 %rd1787, %r3326, 28; | |
add.s64 %rd1788, %rd1786, %rd1787; | |
ld.global.u32 %r3327, [%rd1788]; | |
and.b32 %r3328, %r3327, 65535; | |
shl.b32 %r3329, %r3328, 6; | |
bfe.u32 %r3330, %r3327, 16, 6; | |
or.b32 %r1353, %r3329, %r3330; | |
st.local.u32 [%rd1+928], %r1353; | |
bfe.u32 %r3331, %r3324, 22, 6; | |
mul.wide.u32 %rd1789, %r3331, 28; | |
add.s64 %rd1790, %rd1786, %rd1789; | |
ld.global.u32 %r3332, [%rd1790]; | |
and.b32 %r3333, %r3332, 65535; | |
shl.b32 %r3334, %r3333, 6; | |
bfe.u32 %r3335, %r3332, 16, 6; | |
or.b32 %r6235, %r3334, %r3335; | |
st.local.u32 [%rd1+932], %r6235; | |
setp.le.u32 %p232, %r1353, %r6235; | |
mov.u32 %r6234, %r1353; | |
@%p232 bra BB0_461; | |
st.local.u32 [%rd1+928], %r6235; | |
st.local.u32 [%rd1+932], %r1353; | |
mov.u32 %r5947, %r6235; | |
mov.u32 %r6235, %r1353; | |
mov.u32 %r6234, %r5947; | |
BB0_461: | |
mov.u32 %r6230, %r6234; | |
mov.u32 %r6231, %r6235; | |
bfe.u32 %r3336, %r1352, 22, 6; | |
mul.lo.s64 %rd1791, %rd119, 1792; | |
add.s64 %rd1792, %rd136, %rd1791; | |
mul.wide.u32 %rd1793, %r3336, 28; | |
add.s64 %rd1794, %rd1792, %rd1793; | |
ld.global.u32 %r3337, [%rd1794]; | |
and.b32 %r3338, %r3337, 65535; | |
bfe.u32 %r3339, %r3337, 16, 6; | |
mul.wide.u32 %rd1795, %r3338, 1792; | |
add.s64 %rd1796, %rd135, %rd1795; | |
mul.wide.u32 %rd1797, %r3339, 28; | |
add.s64 %rd1798, %rd1796, %rd1797; | |
ld.global.u32 %r3340, [%rd1798]; | |
and.b32 %r3341, %r3340, 65535; | |
shl.b32 %r3342, %r3341, 6; | |
bfe.u32 %r3343, %r3340, 16, 6; | |
or.b32 %r1357, %r3342, %r3343; | |
st.local.u32 [%rd1+936], %r1357; | |
bfe.u32 %r3344, %r3337, 22, 6; | |
mul.wide.u32 %rd1799, %r3344, 28; | |
add.s64 %rd1800, %rd1796, %rd1799; | |
ld.global.u32 %r3345, [%rd1800]; | |
and.b32 %r3346, %r3345, 65535; | |
shl.b32 %r3347, %r3346, 6; | |
bfe.u32 %r3348, %r3345, 16, 6; | |
or.b32 %r6237, %r3347, %r3348; | |
st.local.u32 [%rd1+940], %r6237; | |
setp.le.u32 %p233, %r1357, %r6237; | |
mov.u32 %r6236, %r1357; | |
@%p233 bra BB0_463; | |
st.local.u32 [%rd1+936], %r6237; | |
st.local.u32 [%rd1+940], %r1357; | |
mov.u32 %r5953, %r6237; | |
mov.u32 %r6237, %r1357; | |
mov.u32 %r6236, %r5953; | |
BB0_463: | |
mov.u32 %r1360, %r6236; | |
mov.u32 %r1359, %r6237; | |
setp.le.u32 %p234, %r6230, %r1360; | |
mov.u32 %r6232, %r1360; | |
mov.u32 %r6233, %r1359; | |
@%p234 bra BB0_465; | |
st.local.u32 [%rd1+928], %r1360; | |
st.local.u32 [%rd1+936], %r6230; | |
st.local.u32 [%rd1+932], %r1359; | |
st.local.u32 [%rd1+940], %r6231; | |
mov.u32 %r5950, %r6231; | |
mov.u32 %r5952, %r6230; | |
mov.u32 %r6231, %r1359; | |
mov.u32 %r6230, %r1360; | |
mov.u32 %r6232, %r5952; | |
mov.u32 %r6233, %r5950; | |
BB0_465: | |
mov.u32 %r6222, %r6230; | |
mov.u32 %r6223, %r6231; | |
mov.u32 %r6224, %r6232; | |
mov.u32 %r6225, %r6233; | |
mul.lo.s64 %rd1801, %rd118, 1792; | |
add.s64 %rd1802, %rd3, %rd1801; | |
bfe.u32 %r3349, %r1351, 22, 6; | |
mul.wide.u32 %rd1803, %r3349, 28; | |
add.s64 %rd1804, %rd1802, %rd1803; | |
ld.global.u32 %r1365, [%rd1804+-8]; | |
and.b32 %r3350, %r1365, 65535; | |
cvt.u64.u32 %rd120, %r3350; | |
bfe.u32 %r3351, %r1365, 16, 6; | |
mul.wide.u32 %rd1805, %r3350, 1792; | |
add.s64 %rd1806, %rd136, %rd1805; | |
mul.wide.u32 %rd1807, %r3351, 28; | |
add.s64 %rd1808, %rd1806, %rd1807; | |
ld.global.u32 %r3352, [%rd1808]; | |
and.b32 %r3353, %r3352, 65535; | |
bfe.u32 %r3354, %r3352, 16, 6; | |
mul.wide.u32 %rd1809, %r3353, 1792; | |
add.s64 %rd1810, %rd135, %rd1809; | |
mul.wide.u32 %rd1811, %r3354, 28; | |
add.s64 %rd1812, %rd1810, %rd1811; | |
ld.global.u32 %r3355, [%rd1812]; | |
and.b32 %r3356, %r3355, 65535; | |
shl.b32 %r3357, %r3356, 6; | |
bfe.u32 %r3358, %r3355, 16, 6; | |
or.b32 %r1366, %r3357, %r3358; | |
st.local.u32 [%rd1+944], %r1366; | |
bfe.u32 %r3359, %r3352, 22, 6; | |
mul.wide.u32 %rd1813, %r3359, 28; | |
add.s64 %rd1814, %rd1810, %rd1813; | |
ld.global.u32 %r3360, [%rd1814]; | |
and.b32 %r3361, %r3360, 65535; | |
shl.b32 %r3362, %r3361, 6; | |
bfe.u32 %r3363, %r3360, 16, 6; | |
or.b32 %r6243, %r3362, %r3363; | |
st.local.u32 [%rd1+948], %r6243; | |
setp.le.u32 %p235, %r1366, %r6243; | |
mov.u32 %r6242, %r1366; | |
@%p235 bra BB0_467; | |
st.local.u32 [%rd1+944], %r6243; | |
st.local.u32 [%rd1+948], %r1366; | |
mov.u32 %r5967, %r6243; | |
mov.u32 %r6243, %r1366; | |
mov.u32 %r6242, %r5967; | |
BB0_467: | |
mov.u32 %r6238, %r6242; | |
mov.u32 %r6239, %r6243; | |
bfe.u32 %r3364, %r1365, 22, 6; | |
mul.lo.s64 %rd1815, %rd120, 1792; | |
add.s64 %rd1816, %rd136, %rd1815; | |
mul.wide.u32 %rd1817, %r3364, 28; | |
add.s64 %rd1818, %rd1816, %rd1817; | |
ld.global.u32 %r3365, [%rd1818]; | |
and.b32 %r3366, %r3365, 65535; | |
bfe.u32 %r3367, %r3365, 16, 6; | |
mul.wide.u32 %rd1819, %r3366, 1792; | |
add.s64 %rd1820, %rd135, %rd1819; | |
mul.wide.u32 %rd1821, %r3367, 28; | |
add.s64 %rd1822, %rd1820, %rd1821; | |
ld.global.u32 %r3368, [%rd1822]; | |
and.b32 %r3369, %r3368, 65535; | |
shl.b32 %r3370, %r3369, 6; | |
bfe.u32 %r3371, %r3368, 16, 6; | |
or.b32 %r1370, %r3370, %r3371; | |
st.local.u32 [%rd1+952], %r1370; | |
bfe.u32 %r3372, %r3365, 22, 6; | |
mul.wide.u32 %rd1823, %r3372, 28; | |
add.s64 %rd1824, %rd1820, %rd1823; | |
ld.global.u32 %r3373, [%rd1824]; | |
and.b32 %r3374, %r3373, 65535; | |
shl.b32 %r3375, %r3374, 6; | |
bfe.u32 %r3376, %r3373, 16, 6; | |
or.b32 %r6245, %r3375, %r3376; | |
st.local.u32 [%rd1+956], %r6245; | |
setp.le.u32 %p236, %r1370, %r6245; | |
mov.u32 %r6244, %r1370; | |
@%p236 bra BB0_469; | |
st.local.u32 [%rd1+952], %r6245; | |
st.local.u32 [%rd1+956], %r1370; | |
mov.u32 %r5973, %r6245; | |
mov.u32 %r6245, %r1370; | |
mov.u32 %r6244, %r5973; | |
BB0_469: | |
mov.u32 %r1373, %r6244; | |
mov.u32 %r1372, %r6245; | |
setp.le.u32 %p237, %r6238, %r1373; | |
mov.u32 %r6240, %r1373; | |
mov.u32 %r6241, %r1372; | |
@%p237 bra BB0_471; | |
st.local.u32 [%rd1+944], %r1373; | |
st.local.u32 [%rd1+952], %r6238; | |
st.local.u32 [%rd1+948], %r1372; | |
st.local.u32 [%rd1+956], %r6239; | |
mov.u32 %r5970, %r6239; | |
mov.u32 %r5972, %r6238; | |
mov.u32 %r6239, %r1372; | |
mov.u32 %r6238, %r1373; | |
mov.u32 %r6240, %r5972; | |
mov.u32 %r6241, %r5970; | |
BB0_471: | |
mov.u32 %r1377, %r6238; | |
mov.u32 %r1376, %r6239; | |
mov.u32 %r1375, %r6240; | |
mov.u32 %r1374, %r6241; | |
setp.le.u32 %p238, %r6222, %r1377; | |
mov.u32 %r6226, %r1377; | |
mov.u32 %r6227, %r1376; | |
mov.u32 %r6228, %r1375; | |
mov.u32 %r6229, %r1374; | |
@%p238 bra BB0_473; | |
st.local.u32 [%rd1+928], %r1377; | |
st.local.u32 [%rd1+944], %r6222; | |
st.local.u32 [%rd1+932], %r1376; | |
st.local.u32 [%rd1+948], %r6223; | |
st.local.u32 [%rd1+936], %r1375; | |
st.local.u32 [%rd1+952], %r6224; | |
st.local.u32 [%rd1+940], %r1374; | |
st.local.u32 [%rd1+956], %r6225; | |
mov.u32 %r5960, %r6225; | |
mov.u32 %r5962, %r6224; | |
mov.u32 %r5964, %r6223; | |
mov.u32 %r5966, %r6222; | |
mov.u32 %r6225, %r1374; | |
mov.u32 %r6224, %r1375; | |
mov.u32 %r6223, %r1376; | |
mov.u32 %r6222, %r1377; | |
mov.u32 %r6226, %r5966; | |
mov.u32 %r6227, %r5964; | |
mov.u32 %r6228, %r5962; | |
mov.u32 %r6229, %r5960; | |
BB0_473: | |
mov.u32 %r1385, %r6222; | |
mov.u32 %r1384, %r6223; | |
mov.u32 %r1383, %r6224; | |
mov.u32 %r1382, %r6225; | |
mov.u32 %r1381, %r6226; | |
mov.u32 %r1380, %r6227; | |
mov.u32 %r1379, %r6228; | |
mov.u32 %r1378, %r6229; | |
setp.le.u32 %p239, %r6182, %r1385; | |
mov.u32 %r6190, %r1385; | |
mov.u32 %r6191, %r1384; | |
mov.u32 %r6192, %r1383; | |
mov.u32 %r6193, %r1382; | |
mov.u32 %r6194, %r1381; | |
mov.u32 %r6195, %r1380; | |
mov.u32 %r6196, %r1379; | |
mov.u32 %r6197, %r1378; | |
@%p239 bra BB0_475; | |
st.local.u32 [%rd1+896], %r1385; | |
st.local.u32 [%rd1+928], %r6182; | |
st.local.u32 [%rd1+900], %r1384; | |
st.local.u32 [%rd1+932], %r6183; | |
st.local.u32 [%rd1+904], %r1383; | |
st.local.u32 [%rd1+936], %r6184; | |
st.local.u32 [%rd1+908], %r1382; | |
st.local.u32 [%rd1+940], %r6185; | |
st.local.u32 [%rd1+912], %r1381; | |
st.local.u32 [%rd1+944], %r6186; | |
st.local.u32 [%rd1+916], %r1380; | |
st.local.u32 [%rd1+948], %r6187; | |
st.local.u32 [%rd1+920], %r1379; | |
st.local.u32 [%rd1+952], %r6188; | |
st.local.u32 [%rd1+924], %r1378; | |
st.local.u32 [%rd1+956], %r6189; | |
mov.u32 %r5932, %r6189; | |
mov.u32 %r5934, %r6188; | |
mov.u32 %r5936, %r6187; | |
mov.u32 %r5938, %r6186; | |
mov.u32 %r5940, %r6185; | |
mov.u32 %r5942, %r6184; | |
mov.u32 %r5944, %r6183; | |
mov.u32 %r5946, %r6182; | |
mov.u32 %r6189, %r1378; | |
mov.u32 %r6188, %r1379; | |
mov.u32 %r6187, %r1380; | |
mov.u32 %r6186, %r1381; | |
mov.u32 %r6185, %r1382; | |
mov.u32 %r6184, %r1383; | |
mov.u32 %r6183, %r1384; | |
mov.u32 %r6182, %r1385; | |
mov.u32 %r6190, %r5946; | |
mov.u32 %r6191, %r5944; | |
mov.u32 %r6192, %r5942; | |
mov.u32 %r6193, %r5940; | |
mov.u32 %r6194, %r5938; | |
mov.u32 %r6195, %r5936; | |
mov.u32 %r6196, %r5934; | |
mov.u32 %r6197, %r5932; | |
BB0_475: | |
mov.u32 %r1401, %r6182; | |
mul.lo.s64 %rd1825, %rd113, 1792; | |
add.s64 %rd1826, %rd3, %rd1825; | |
bfe.u32 %r3377, %r1314, 22, 6; | |
mul.wide.u32 %rd1827, %r3377, 28; | |
add.s64 %rd1828, %rd1826, %rd1827; | |
ld.global.u32 %r1402, [%rd1828+-4]; | |
and.b32 %r3378, %r1402, 65535; | |
mul.wide.u32 %rd1829, %r3378, 1792; | |
add.s64 %rd1830, %rd136, %rd1829; | |
bfe.u32 %r3379, %r1402, 16, 6; | |
mul.wide.u32 %rd1831, %r3379, 28; | |
add.s64 %rd1832, %rd1830, %rd1831; | |
ld.global.u32 %r1403, [%rd1832+4]; | |
and.b32 %r3380, %r1403, 65535; | |
mul.wide.u32 %rd1833, %r3380, 1792; | |
add.s64 %rd1834, %rd3, %rd1833; | |
cvt.u64.u32 %rd121, %r3378; | |
cvt.u64.u32 %rd122, %r3380; | |
bfe.u32 %r3381, %r1403, 16, 6; | |
mul.wide.u32 %rd1835, %r3381, 28; | |
add.s64 %rd1836, %rd1834, %rd1835; | |
ld.global.u32 %r1404, [%rd1836+-8]; | |
and.b32 %r3382, %r1404, 65535; | |
cvt.u64.u32 %rd123, %r3382; | |
bfe.u32 %r3383, %r1404, 16, 6; | |
mul.wide.u32 %rd1837, %r3382, 1792; | |
add.s64 %rd1838, %rd136, %rd1837; | |
mul.wide.u32 %rd1839, %r3383, 28; | |
add.s64 %rd1840, %rd1838, %rd1839; | |
ld.global.u32 %r3384, [%rd1840]; | |
and.b32 %r3385, %r3384, 65535; | |
bfe.u32 %r3386, %r3384, 16, 6; | |
mul.wide.u32 %rd1841, %r3385, 1792; | |
add.s64 %rd1842, %rd135, %rd1841; | |
mul.wide.u32 %rd1843, %r3386, 28; | |
add.s64 %rd1844, %rd1842, %rd1843; | |
ld.global.u32 %r3387, [%rd1844]; | |
and.b32 %r3388, %r3387, 65535; | |
shl.b32 %r3389, %r3388, 6; | |
bfe.u32 %r3390, %r3387, 16, 6; | |
or.b32 %r1405, %r3389, %r3390; | |
st.local.u32 [%rd1+960], %r1405; | |
bfe.u32 %r3391, %r3384, 22, 6; | |
mul.wide.u32 %rd1845, %r3391, 28; | |
add.s64 %rd1846, %rd1842, %rd1845; | |
ld.global.u32 %r3392, [%rd1846]; | |
and.b32 %r3393, %r3392, 65535; | |
shl.b32 %r3394, %r3393, 6; | |
bfe.u32 %r3395, %r3392, 16, 6; | |
or.b32 %r6147, %r3394, %r3395; | |
st.local.u32 [%rd1+964], %r6147; | |
setp.le.u32 %p240, %r1405, %r6147; | |
mov.u32 %r6146, %r1405; | |
@%p240 bra BB0_477; | |
st.local.u32 [%rd1+960], %r6147; | |
st.local.u32 [%rd1+964], %r1405; | |
mov.u32 %r6004, %r6147; | |
mov.u32 %r6147, %r1405; | |
mov.u32 %r6146, %r6004; | |
BB0_477: | |
mov.u32 %r6142, %r6146; | |
mov.u32 %r6143, %r6147; | |
bfe.u32 %r3396, %r1404, 22, 6; | |
mul.lo.s64 %rd1847, %rd123, 1792; | |
add.s64 %rd1848, %rd136, %rd1847; | |
mul.wide.u32 %rd1849, %r3396, 28; | |
add.s64 %rd1850, %rd1848, %rd1849; | |
ld.global.u32 %r3397, [%rd1850]; | |
and.b32 %r3398, %r3397, 65535; | |
bfe.u32 %r3399, %r3397, 16, 6; | |
mul.wide.u32 %rd1851, %r3398, 1792; | |
add.s64 %rd1852, %rd135, %rd1851; | |
mul.wide.u32 %rd1853, %r3399, 28; | |
add.s64 %rd1854, %rd1852, %rd1853; | |
ld.global.u32 %r3400, [%rd1854]; | |
and.b32 %r3401, %r3400, 65535; | |
shl.b32 %r3402, %r3401, 6; | |
bfe.u32 %r3403, %r3400, 16, 6; | |
or.b32 %r1409, %r3402, %r3403; | |
st.local.u32 [%rd1+968], %r1409; | |
bfe.u32 %r3404, %r3397, 22, 6; | |
mul.wide.u32 %rd1855, %r3404, 28; | |
add.s64 %rd1856, %rd1852, %rd1855; | |
ld.global.u32 %r3405, [%rd1856]; | |
and.b32 %r3406, %r3405, 65535; | |
shl.b32 %r3407, %r3406, 6; | |
bfe.u32 %r3408, %r3405, 16, 6; | |
or.b32 %r6149, %r3407, %r3408; | |
st.local.u32 [%rd1+972], %r6149; | |
setp.le.u32 %p241, %r1409, %r6149; | |
mov.u32 %r6148, %r1409; | |
@%p241 bra BB0_479; | |
st.local.u32 [%rd1+968], %r6149; | |
st.local.u32 [%rd1+972], %r1409; | |
mov.u32 %r6010, %r6149; | |
mov.u32 %r6149, %r1409; | |
mov.u32 %r6148, %r6010; | |
BB0_479: | |
mov.u32 %r1412, %r6148; | |
mov.u32 %r1411, %r6149; | |
setp.le.u32 %p242, %r6142, %r1412; | |
mov.u32 %r6144, %r1412; | |
mov.u32 %r6145, %r1411; | |
@%p242 bra BB0_481; | |
st.local.u32 [%rd1+960], %r1412; | |
st.local.u32 [%rd1+968], %r6142; | |
st.local.u32 [%rd1+964], %r1411; | |
st.local.u32 [%rd1+972], %r6143; | |
mov.u32 %r6007, %r6143; | |
mov.u32 %r6009, %r6142; | |
mov.u32 %r6143, %r1411; | |
mov.u32 %r6142, %r1412; | |
mov.u32 %r6144, %r6009; | |
mov.u32 %r6145, %r6007; | |
BB0_481: | |
mov.u32 %r6134, %r6142; | |
mov.u32 %r6135, %r6143; | |
mov.u32 %r6136, %r6144; | |
mov.u32 %r6137, %r6145; | |
mul.lo.s64 %rd1857, %rd122, 1792; | |
add.s64 %rd1858, %rd3, %rd1857; | |
bfe.u32 %r3409, %r1403, 22, 6; | |
mul.wide.u32 %rd1859, %r3409, 28; | |
add.s64 %rd1860, %rd1858, %rd1859; | |
ld.global.u32 %r1417, [%rd1860+-8]; | |
and.b32 %r3410, %r1417, 65535; | |
cvt.u64.u32 %rd124, %r3410; | |
bfe.u32 %r3411, %r1417, 16, 6; | |
mul.wide.u32 %rd1861, %r3410, 1792; | |
add.s64 %rd1862, %rd136, %rd1861; | |
mul.wide.u32 %rd1863, %r3411, 28; | |
add.s64 %rd1864, %rd1862, %rd1863; | |
ld.global.u32 %r3412, [%rd1864]; | |
and.b32 %r3413, %r3412, 65535; | |
bfe.u32 %r3414, %r3412, 16, 6; | |
mul.wide.u32 %rd1865, %r3413, 1792; | |
add.s64 %rd1866, %rd135, %rd1865; | |
mul.wide.u32 %rd1867, %r3414, 28; | |
add.s64 %rd1868, %rd1866, %rd1867; | |
ld.global.u32 %r3415, [%rd1868]; | |
and.b32 %r3416, %r3415, 65535; | |
shl.b32 %r3417, %r3416, 6; | |
bfe.u32 %r3418, %r3415, 16, 6; | |
or.b32 %r1418, %r3417, %r3418; | |
st.local.u32 [%rd1+976], %r1418; | |
bfe.u32 %r3419, %r3412, 22, 6; | |
mul.wide.u32 %rd1869, %r3419, 28; | |
add.s64 %rd1870, %rd1866, %rd1869; | |
ld.global.u32 %r3420, [%rd1870]; | |
and.b32 %r3421, %r3420, 65535; | |
shl.b32 %r3422, %r3421, 6; | |
bfe.u32 %r3423, %r3420, 16, 6; | |
or.b32 %r6155, %r3422, %r3423; | |
st.local.u32 [%rd1+980], %r6155; | |
setp.le.u32 %p243, %r1418, %r6155; | |
mov.u32 %r6154, %r1418; | |
@%p243 bra BB0_483; | |
st.local.u32 [%rd1+976], %r6155; | |
st.local.u32 [%rd1+980], %r1418; | |
mov.u32 %r6024, %r6155; | |
mov.u32 %r6155, %r1418; | |
mov.u32 %r6154, %r6024; | |
BB0_483: | |
mov.u32 %r6150, %r6154; | |
mov.u32 %r6151, %r6155; | |
bfe.u32 %r3424, %r1417, 22, 6; | |
mul.lo.s64 %rd1871, %rd124, 1792; | |
add.s64 %rd1872, %rd136, %rd1871; | |
mul.wide.u32 %rd1873, %r3424, 28; | |
add.s64 %rd1874, %rd1872, %rd1873; | |
ld.global.u32 %r3425, [%rd1874]; | |
and.b32 %r3426, %r3425, 65535; | |
bfe.u32 %r3427, %r3425, 16, 6; | |
mul.wide.u32 %rd1875, %r3426, 1792; | |
add.s64 %rd1876, %rd135, %rd1875; | |
mul.wide.u32 %rd1877, %r3427, 28; | |
add.s64 %rd1878, %rd1876, %rd1877; | |
ld.global.u32 %r3428, [%rd1878]; | |
and.b32 %r3429, %r3428, 65535; | |
shl.b32 %r3430, %r3429, 6; | |
bfe.u32 %r3431, %r3428, 16, 6; | |
or.b32 %r1422, %r3430, %r3431; | |
st.local.u32 [%rd1+984], %r1422; | |
bfe.u32 %r3432, %r3425, 22, 6; | |
mul.wide.u32 %rd1879, %r3432, 28; | |
add.s64 %rd1880, %rd1876, %rd1879; | |
ld.global.u32 %r3433, [%rd1880]; | |
and.b32 %r3434, %r3433, 65535; | |
shl.b32 %r3435, %r3434, 6; | |
bfe.u32 %r3436, %r3433, 16, 6; | |
or.b32 %r6157, %r3435, %r3436; | |
st.local.u32 [%rd1+988], %r6157; | |
setp.le.u32 %p244, %r1422, %r6157; | |
mov.u32 %r6156, %r1422; | |
@%p244 bra BB0_485; | |
st.local.u32 [%rd1+984], %r6157; | |
st.local.u32 [%rd1+988], %r1422; | |
mov.u32 %r6030, %r6157; | |
mov.u32 %r6157, %r1422; | |
mov.u32 %r6156, %r6030; | |
BB0_485: | |
mov.u32 %r1425, %r6156; | |
mov.u32 %r1424, %r6157; | |
setp.le.u32 %p245, %r6150, %r1425; | |
mov.u32 %r6152, %r1425; | |
mov.u32 %r6153, %r1424; | |
@%p245 bra BB0_487; | |
st.local.u32 [%rd1+976], %r1425; | |
st.local.u32 [%rd1+984], %r6150; | |
st.local.u32 [%rd1+980], %r1424; | |
st.local.u32 [%rd1+988], %r6151; | |
mov.u32 %r6027, %r6151; | |
mov.u32 %r6029, %r6150; | |
mov.u32 %r6151, %r1424; | |
mov.u32 %r6150, %r1425; | |
mov.u32 %r6152, %r6029; | |
mov.u32 %r6153, %r6027; | |
BB0_487: | |
mov.u32 %r1429, %r6150; | |
mov.u32 %r1428, %r6151; | |
mov.u32 %r1427, %r6152; | |
mov.u32 %r1426, %r6153; | |
setp.le.u32 %p246, %r6134, %r1429; | |
mov.u32 %r6138, %r1429; | |
mov.u32 %r6139, %r1428; | |
mov.u32 %r6140, %r1427; | |
mov.u32 %r6141, %r1426; | |
@%p246 bra BB0_489; | |
st.local.u32 [%rd1+960], %r1429; | |
st.local.u32 [%rd1+976], %r6134; | |
st.local.u32 [%rd1+964], %r1428; | |
st.local.u32 [%rd1+980], %r6135; | |
st.local.u32 [%rd1+968], %r1427; | |
st.local.u32 [%rd1+984], %r6136; | |
st.local.u32 [%rd1+972], %r1426; | |
st.local.u32 [%rd1+988], %r6137; | |
mov.u32 %r6017, %r6137; | |
mov.u32 %r6019, %r6136; | |
mov.u32 %r6021, %r6135; | |
mov.u32 %r6023, %r6134; | |
mov.u32 %r6137, %r1426; | |
mov.u32 %r6136, %r1427; | |
mov.u32 %r6135, %r1428; | |
mov.u32 %r6134, %r1429; | |
mov.u32 %r6138, %r6023; | |
mov.u32 %r6139, %r6021; | |
mov.u32 %r6140, %r6019; | |
mov.u32 %r6141, %r6017; | |
BB0_489: | |
mov.u32 %r6118, %r6134; | |
mov.u32 %r6119, %r6135; | |
mov.u32 %r6120, %r6136; | |
mov.u32 %r6121, %r6137; | |
mov.u32 %r6122, %r6138; | |
mov.u32 %r6123, %r6139; | |
mov.u32 %r6124, %r6140; | |
mov.u32 %r6125, %r6141; | |
mul.lo.s64 %rd1881, %rd121, 1792; | |
add.s64 %rd1882, %rd136, %rd1881; | |
bfe.u32 %r3437, %r1402, 22, 6; | |
mul.wide.u32 %rd1883, %r3437, 28; | |
add.s64 %rd1884, %rd1882, %rd1883; | |
ld.global.u32 %r1438, [%rd1884+4]; | |
and.b32 %r3438, %r1438, 65535; | |
mul.wide.u32 %rd1885, %r3438, 1792; | |
add.s64 %rd1886, %rd3, %rd1885; | |
cvt.u64.u32 %rd125, %r3438; | |
bfe.u32 %r3439, %r1438, 16, 6; | |
mul.wide.u32 %rd1887, %r3439, 28; | |
add.s64 %rd1888, %rd1886, %rd1887; | |
ld.global.u32 %r1439, [%rd1888+-8]; | |
and.b32 %r3440, %r1439, 65535; | |
cvt.u64.u32 %rd126, %r3440; | |
bfe.u32 %r3441, %r1439, 16, 6; | |
mul.wide.u32 %rd1889, %r3440, 1792; | |
add.s64 %rd1890, %rd136, %rd1889; | |
mul.wide.u32 %rd1891, %r3441, 28; | |
add.s64 %rd1892, %rd1890, %rd1891; | |
ld.global.u32 %r3442, [%rd1892]; | |
and.b32 %r3443, %r3442, 65535; | |
bfe.u32 %r3444, %r3442, 16, 6; | |
mul.wide.u32 %rd1893, %r3443, 1792; | |
add.s64 %rd1894, %rd135, %rd1893; | |
mul.wide.u32 %rd1895, %r3444, 28; | |
add.s64 %rd1896, %rd1894, %rd1895; | |
ld.global.u32 %r3445, [%rd1896]; | |
and.b32 %r3446, %r3445, 65535; | |
shl.b32 %r3447, %r3446, 6; | |
bfe.u32 %r3448, %r3445, 16, 6; | |
or.b32 %r1440, %r3447, %r3448; | |
st.local.u32 [%rd1+992], %r1440; | |
bfe.u32 %r3449, %r3442, 22, 6; | |
mul.wide.u32 %rd1897, %r3449, 28; | |
add.s64 %rd1898, %rd1894, %rd1897; | |
ld.global.u32 %r3450, [%rd1898]; | |
and.b32 %r3451, %r3450, 65535; | |
shl.b32 %r3452, %r3451, 6; | |
bfe.u32 %r3453, %r3450, 16, 6; | |
or.b32 %r6171, %r3452, %r3453; | |
st.local.u32 [%rd1+996], %r6171; | |
setp.le.u32 %p247, %r1440, %r6171; | |
mov.u32 %r6170, %r1440; | |
@%p247 bra BB0_491; | |
st.local.u32 [%rd1+992], %r6171; | |
st.local.u32 [%rd1+996], %r1440; | |
mov.u32 %r6060, %r6171; | |
mov.u32 %r6171, %r1440; | |
mov.u32 %r6170, %r6060; | |
BB0_491: | |
mov.u32 %r6166, %r6170; | |
mov.u32 %r6167, %r6171; | |
bfe.u32 %r3454, %r1439, 22, 6; | |
mul.lo.s64 %rd1899, %rd126, 1792; | |
add.s64 %rd1900, %rd136, %rd1899; | |
mul.wide.u32 %rd1901, %r3454, 28; | |
add.s64 %rd1902, %rd1900, %rd1901; | |
ld.global.u32 %r3455, [%rd1902]; | |
and.b32 %r3456, %r3455, 65535; | |
bfe.u32 %r3457, %r3455, 16, 6; | |
mul.wide.u32 %rd1903, %r3456, 1792; | |
add.s64 %rd1904, %rd135, %rd1903; | |
mul.wide.u32 %rd1905, %r3457, 28; | |
add.s64 %rd1906, %rd1904, %rd1905; | |
ld.global.u32 %r3458, [%rd1906]; | |
and.b32 %r3459, %r3458, 65535; | |
shl.b32 %r3460, %r3459, 6; | |
bfe.u32 %r3461, %r3458, 16, 6; | |
or.b32 %r1444, %r3460, %r3461; | |
st.local.u32 [%rd1+1000], %r1444; | |
bfe.u32 %r3462, %r3455, 22, 6; | |
mul.wide.u32 %rd1907, %r3462, 28; | |
add.s64 %rd1908, %rd1904, %rd1907; | |
ld.global.u32 %r3463, [%rd1908]; | |
and.b32 %r3464, %r3463, 65535; | |
shl.b32 %r3465, %r3464, 6; | |
bfe.u32 %r3466, %r3463, 16, 6; | |
or.b32 %r6173, %r3465, %r3466; | |
st.local.u32 [%rd1+1004], %r6173; | |
setp.le.u32 %p248, %r1444, %r6173; | |
mov.u32 %r6172, %r1444; | |
@%p248 bra BB0_493; | |
st.local.u32 [%rd1+1000], %r6173; | |
st.local.u32 [%rd1+1004], %r1444; | |
mov.u32 %r6066, %r6173; | |
mov.u32 %r6173, %r1444; | |
mov.u32 %r6172, %r6066; | |
BB0_493: | |
mov.u32 %r1447, %r6172; | |
mov.u32 %r1446, %r6173; | |
setp.le.u32 %p249, %r6166, %r1447; | |
mov.u32 %r6168, %r1447; | |
mov.u32 %r6169, %r1446; | |
@%p249 bra BB0_495; | |
st.local.u32 [%rd1+992], %r1447; | |
st.local.u32 [%rd1+1000], %r6166; | |
st.local.u32 [%rd1+996], %r1446; | |
st.local.u32 [%rd1+1004], %r6167; | |
mov.u32 %r6063, %r6167; | |
mov.u32 %r6065, %r6166; | |
mov.u32 %r6167, %r1446; | |
mov.u32 %r6166, %r1447; | |
mov.u32 %r6168, %r6065; | |
mov.u32 %r6169, %r6063; | |
BB0_495: | |
mov.u32 %r6158, %r6166; | |
mov.u32 %r6159, %r6167; | |
mov.u32 %r6160, %r6168; | |
mov.u32 %r6161, %r6169; | |
mul.lo.s64 %rd1909, %rd125, 1792; | |
add.s64 %rd1910, %rd3, %rd1909; | |
bfe.u32 %r3467, %r1438, 22, 6; | |
mul.wide.u32 %rd1911, %r3467, 28; | |
add.s64 %rd1912, %rd1910, %rd1911; | |
ld.global.u32 %r1452, [%rd1912+-8]; | |
and.b32 %r3468, %r1452, 65535; | |
cvt.u64.u32 %rd127, %r3468; | |
bfe.u32 %r3469, %r1452, 16, 6; | |
mul.wide.u32 %rd1913, %r3468, 1792; | |
add.s64 %rd1914, %rd136, %rd1913; | |
mul.wide.u32 %rd1915, %r3469, 28; | |
add.s64 %rd1916, %rd1914, %rd1915; | |
ld.global.u32 %r3470, [%rd1916]; | |
and.b32 %r3471, %r3470, 65535; | |
bfe.u32 %r3472, %r3470, 16, 6; | |
mul.wide.u32 %rd1917, %r3471, 1792; | |
add.s64 %rd1918, %rd135, %rd1917; | |
mul.wide.u32 %rd1919, %r3472, 28; | |
add.s64 %rd1920, %rd1918, %rd1919; | |
ld.global.u32 %r3473, [%rd1920]; | |
and.b32 %r3474, %r3473, 65535; | |
shl.b32 %r3475, %r3474, 6; | |
bfe.u32 %r3476, %r3473, 16, 6; | |
or.b32 %r1453, %r3475, %r3476; | |
st.local.u32 [%rd1+1008], %r1453; | |
bfe.u32 %r3477, %r3470, 22, 6; | |
mul.wide.u32 %rd1921, %r3477, 28; | |
add.s64 %rd1922, %rd1918, %rd1921; | |
ld.global.u32 %r3478, [%rd1922]; | |
and.b32 %r3479, %r3478, 65535; | |
shl.b32 %r3480, %r3479, 6; | |
bfe.u32 %r3481, %r3478, 16, 6; | |
or.b32 %r6179, %r3480, %r3481; | |
st.local.u32 [%rd1+1012], %r6179; | |
setp.le.u32 %p250, %r1453, %r6179; | |
mov.u32 %r6178, %r1453; | |
@%p250 bra BB0_497; | |
st.local.u32 [%rd1+1008], %r6179; | |
st.local.u32 [%rd1+1012], %r1453; | |
mov.u32 %r6080, %r6179; | |
mov.u32 %r6179, %r1453; | |
mov.u32 %r6178, %r6080; | |
BB0_497: | |
mov.u32 %r6174, %r6178; | |
mov.u32 %r6175, %r6179; | |
bfe.u32 %r3482, %r1452, 22, 6; | |
mul.lo.s64 %rd1923, %rd127, 1792; | |
add.s64 %rd1924, %rd136, %rd1923; | |
mul.wide.u32 %rd1925, %r3482, 28; | |
add.s64 %rd1926, %rd1924, %rd1925; | |
ld.global.u32 %r3483, [%rd1926]; | |
and.b32 %r3484, %r3483, 65535; | |
bfe.u32 %r3485, %r3483, 16, 6; | |
mul.wide.u32 %rd1927, %r3484, 1792; | |
add.s64 %rd1928, %rd135, %rd1927; | |
mul.wide.u32 %rd1929, %r3485, 28; | |
add.s64 %rd1930, %rd1928, %rd1929; | |
ld.global.u32 %r3486, [%rd1930]; | |
and.b32 %r3487, %r3486, 65535; | |
shl.b32 %r3488, %r3487, 6; | |
bfe.u32 %r3489, %r3486, 16, 6; | |
or.b32 %r1457, %r3488, %r3489; | |
st.local.u32 [%rd1+1016], %r1457; | |
bfe.u32 %r3490, %r3483, 22, 6; | |
mul.wide.u32 %rd1931, %r3490, 28; | |
add.s64 %rd1932, %rd1928, %rd1931; | |
ld.global.u32 %r3491, [%rd1932]; | |
and.b32 %r3492, %r3491, 65535; | |
shl.b32 %r3493, %r3492, 6; | |
bfe.u32 %r3494, %r3491, 16, 6; | |
or.b32 %r6181, %r3493, %r3494; | |
st.local.u32 [%rd1+1020], %r6181; | |
setp.le.u32 %p251, %r1457, %r6181; | |
mov.u32 %r6180, %r1457; | |
@%p251 bra BB0_499; | |
st.local.u32 [%rd1+1016], %r6181; | |
st.local.u32 [%rd1+1020], %r1457; | |
mov.u32 %r6086, %r6181; | |
mov.u32 %r6181, %r1457; | |
mov.u32 %r6180, %r6086; | |
BB0_499: | |
mov.u32 %r1460, %r6180; | |
mov.u32 %r1459, %r6181; | |
setp.le.u32 %p252, %r6174, %r1460; | |
mov.u32 %r6176, %r1460; | |
mov.u32 %r6177, %r1459; | |
@%p252 bra BB0_501; | |
st.local.u32 [%rd1+1008], %r1460; | |
st.local.u32 [%rd1+1016], %r6174; | |
st.local.u32 [%rd1+1012], %r1459; | |
st.local.u32 [%rd1+1020], %r6175; | |
mov.u32 %r6083, %r6175; | |
mov.u32 %r6085, %r6174; | |
mov.u32 %r6175, %r1459; | |
mov.u32 %r6174, %r1460; | |
mov.u32 %r6176, %r6085; | |
mov.u32 %r6177, %r6083; | |
BB0_501: | |
mov.u32 %r1464, %r6174; | |
mov.u32 %r1463, %r6175; | |
mov.u32 %r1462, %r6176; | |
mov.u32 %r1461, %r6177; | |
setp.le.u32 %p253, %r6158, %r1464; | |
mov.u32 %r6162, %r1464; | |
mov.u32 %r6163, %r1463; | |
mov.u32 %r6164, %r1462; | |
mov.u32 %r6165, %r1461; | |
@%p253 bra BB0_503; | |
st.local.u32 [%rd1+992], %r1464; | |
st.local.u32 [%rd1+1008], %r6158; | |
st.local.u32 [%rd1+996], %r1463; | |
st.local.u32 [%rd1+1012], %r6159; | |
st.local.u32 [%rd1+1000], %r1462; | |
st.local.u32 [%rd1+1016], %r6160; | |
st.local.u32 [%rd1+1004], %r1461; | |
st.local.u32 [%rd1+1020], %r6161; | |
mov.u32 %r6073, %r6161; | |
mov.u32 %r6075, %r6160; | |
mov.u32 %r6077, %r6159; | |
mov.u32 %r6079, %r6158; | |
mov.u32 %r6161, %r1461; | |
mov.u32 %r6160, %r1462; | |
mov.u32 %r6159, %r1463; | |
mov.u32 %r6158, %r1464; | |
mov.u32 %r6162, %r6079; | |
mov.u32 %r6163, %r6077; | |
mov.u32 %r6164, %r6075; | |
mov.u32 %r6165, %r6073; | |
BB0_503: | |
mov.u32 %r1472, %r6158; | |
mov.u32 %r1471, %r6159; | |
mov.u32 %r1470, %r6160; | |
mov.u32 %r1469, %r6161; | |
mov.u32 %r1468, %r6162; | |
mov.u32 %r1467, %r6163; | |
mov.u32 %r1466, %r6164; | |
mov.u32 %r1465, %r6165; | |
setp.le.u32 %p254, %r6118, %r1472; | |
mov.u32 %r6126, %r1472; | |
mov.u32 %r6127, %r1471; | |
mov.u32 %r6128, %r1470; | |
mov.u32 %r6129, %r1469; | |
mov.u32 %r6130, %r1468; | |
mov.u32 %r6131, %r1467; | |
mov.u32 %r6132, %r1466; | |
mov.u32 %r6133, %r1465; | |
@%p254 bra BB0_505; | |
st.local.u32 [%rd1+960], %r1472; | |
st.local.u32 [%rd1+992], %r6118; | |
st.local.u32 [%rd1+964], %r1471; | |
st.local.u32 [%rd1+996], %r6119; | |
st.local.u32 [%rd1+968], %r1470; | |
st.local.u32 [%rd1+1000], %r6120; | |
st.local.u32 [%rd1+972], %r1469; | |
st.local.u32 [%rd1+1004], %r6121; | |
st.local.u32 [%rd1+976], %r1468; | |
st.local.u32 [%rd1+1008], %r6122; | |
st.local.u32 [%rd1+980], %r1467; | |
st.local.u32 [%rd1+1012], %r6123; | |
st.local.u32 [%rd1+984], %r1466; | |
st.local.u32 [%rd1+1016], %r6124; | |
st.local.u32 [%rd1+988], %r1465; | |
st.local.u32 [%rd1+1020], %r6125; | |
mov.u32 %r6045, %r6125; | |
mov.u32 %r6047, %r6124; | |
mov.u32 %r6049, %r6123; | |
mov.u32 %r6051, %r6122; | |
mov.u32 %r6053, %r6121; | |
mov.u32 %r6055, %r6120; | |
mov.u32 %r6057, %r6119; | |
mov.u32 %r6059, %r6118; | |
mov.u32 %r6125, %r1465; | |
mov.u32 %r6124, %r1466; | |
mov.u32 %r6123, %r1467; | |
mov.u32 %r6122, %r1468; | |
mov.u32 %r6121, %r1469; | |
mov.u32 %r6120, %r1470; | |
mov.u32 %r6119, %r1471; | |
mov.u32 %r6118, %r1472; | |
mov.u32 %r6126, %r6059; | |
mov.u32 %r6127, %r6057; | |
mov.u32 %r6128, %r6055; | |
mov.u32 %r6129, %r6053; | |
mov.u32 %r6130, %r6051; | |
mov.u32 %r6131, %r6049; | |
mov.u32 %r6132, %r6047; | |
mov.u32 %r6133, %r6045; | |
BB0_505: | |
mov.u32 %r1488, %r6118; | |
setp.le.u32 %p255, %r1401, %r1488; | |
mov.u32 %r6117, %r1401; | |
@%p255 bra BB0_507; | |
st.local.u32 [%rd1+896], %r1488; | |
st.local.u32 [%rd1+960], %r1401; | |
st.local.u32 [%rd1+900], %r6119; | |
st.local.u32 [%rd1+964], %r6183; | |
st.local.u32 [%rd1+904], %r6120; | |
st.local.u32 [%rd1+968], %r6184; | |
st.local.u32 [%rd1+908], %r6121; | |
st.local.u32 [%rd1+972], %r6185; | |
st.local.u32 [%rd1+912], %r6122; | |
st.local.u32 [%rd1+976], %r6186; | |
st.local.u32 [%rd1+916], %r6123; | |
st.local.u32 [%rd1+980], %r6187; | |
st.local.u32 [%rd1+920], %r6124; | |
st.local.u32 [%rd1+984], %r6188; | |
st.local.u32 [%rd1+924], %r6125; | |
st.local.u32 [%rd1+988], %r6189; | |
st.local.u32 [%rd1+928], %r6126; | |
st.local.u32 [%rd1+992], %r6190; | |
st.local.u32 [%rd1+932], %r6127; | |
st.local.u32 [%rd1+996], %r6191; | |
st.local.u32 [%rd1+936], %r6128; | |
st.local.u32 [%rd1+1000], %r6192; | |
st.local.u32 [%rd1+940], %r6129; | |
st.local.u32 [%rd1+1004], %r6193; | |
st.local.u32 [%rd1+944], %r6130; | |
st.local.u32 [%rd1+1008], %r6194; | |
st.local.u32 [%rd1+948], %r6131; | |
st.local.u32 [%rd1+1012], %r6195; | |
st.local.u32 [%rd1+952], %r6132; | |
st.local.u32 [%rd1+1016], %r6196; | |
st.local.u32 [%rd1+956], %r6133; | |
st.local.u32 [%rd1+1020], %r6197; | |
mov.u32 %r6117, %r1488; | |
BB0_507: | |
mov.u32 %r6246, -32; | |
setp.le.u32 %p256, %r6474, %r6117; | |
@%p256 bra BB0_511; | |
mov.u64 %rd1939, %rd1; | |
BB0_509: | |
ld.local.u32 %r3496, [%rd1939+768]; | |
ld.local.u32 %r3497, [%rd1939+896]; | |
ld.local.u32 %r3498, [%rd1939+772]; | |
ld.local.u32 %r3499, [%rd1939+900]; | |
ld.local.u32 %r3500, [%rd1939+776]; | |
ld.local.u32 %r3501, [%rd1939+904]; | |
ld.local.u32 %r3502, [%rd1939+780]; | |
ld.local.u32 %r3503, [%rd1939+908]; | |
ld.local.u32 %r3504, [%rd1939+784]; | |
ld.local.u32 %r3505, [%rd1939+912]; | |
ld.local.u32 %r3506, [%rd1939+788]; | |
ld.local.u32 %r3507, [%rd1939+916]; | |
ld.local.u32 %r3508, [%rd1939+792]; | |
ld.local.u32 %r3509, [%rd1939+920]; | |
ld.local.u32 %r3510, [%rd1939+796]; | |
ld.local.u32 %r3511, [%rd1939+924]; | |
st.local.u32 [%rd1939+768], %r3497; | |
st.local.u32 [%rd1939+896], %r3496; | |
st.local.u32 [%rd1939+772], %r3499; | |
st.local.u32 [%rd1939+900], %r3498; | |
st.local.u32 [%rd1939+776], %r3501; | |
st.local.u32 [%rd1939+904], %r3500; | |
st.local.u32 [%rd1939+780], %r3503; | |
st.local.u32 [%rd1939+908], %r3502; | |
st.local.u32 [%rd1939+784], %r3505; | |
st.local.u32 [%rd1939+912], %r3504; | |
st.local.u32 [%rd1939+788], %r3507; | |
st.local.u32 [%rd1939+916], %r3506; | |
st.local.u32 [%rd1939+792], %r3509; | |
st.local.u32 [%rd1939+920], %r3508; | |
st.local.u32 [%rd1939+796], %r3511; | |
st.local.u32 [%rd1939+924], %r3510; | |
add.s64 %rd1939, %rd1939, 32; | |
add.s32 %r6246, %r6246, 8; | |
setp.ne.s32 %p257, %r6246, 0; | |
@%p257 bra BB0_509; | |
ld.local.u32 %r6474, [%rd1+768]; | |
BB0_511: | |
ld.local.u32 %r6605, [%rd1+512]; | |
mov.u32 %r6604, -64; | |
setp.le.u32 %p258, %r6605, %r6474; | |
@%p258 bra BB0_515; | |
mov.u64 %rd1938, %rd1; | |
BB0_513: | |
ld.local.u32 %r3513, [%rd1938+512]; | |
ld.local.u32 %r3514, [%rd1938+768]; | |
ld.local.u32 %r3515, [%rd1938+516]; | |
ld.local.u32 %r3516, [%rd1938+772]; | |
ld.local.u32 %r3517, [%rd1938+520]; | |
ld.local.u32 %r3518, [%rd1938+776]; | |
ld.local.u32 %r3519, [%rd1938+524]; | |
ld.local.u32 %r3520, [%rd1938+780]; | |
ld.local.u32 %r3521, [%rd1938+528]; | |
ld.local.u32 %r3522, [%rd1938+784]; | |
ld.local.u32 %r3523, [%rd1938+532]; | |
ld.local.u32 %r3524, [%rd1938+788]; | |
ld.local.u32 %r3525, [%rd1938+536]; | |
ld.local.u32 %r3526, [%rd1938+792]; | |
ld.local.u32 %r3527, [%rd1938+540]; | |
ld.local.u32 %r3528, [%rd1938+796]; | |
st.local.u32 [%rd1938+512], %r3514; | |
st.local.u32 [%rd1938+768], %r3513; | |
st.local.u32 [%rd1938+516], %r3516; | |
st.local.u32 [%rd1938+772], %r3515; | |
st.local.u32 [%rd1938+520], %r3518; | |
st.local.u32 [%rd1938+776], %r3517; | |
st.local.u32 [%rd1938+524], %r3520; | |
st.local.u32 [%rd1938+780], %r3519; | |
st.local.u32 [%rd1938+528], %r3522; | |
st.local.u32 [%rd1938+784], %r3521; | |
st.local.u32 [%rd1938+532], %r3524; | |
st.local.u32 [%rd1938+788], %r3523; | |
st.local.u32 [%rd1938+536], %r3526; | |
st.local.u32 [%rd1938+792], %r3525; | |
st.local.u32 [%rd1938+540], %r3528; | |
st.local.u32 [%rd1938+796], %r3527; | |
add.s64 %rd1938, %rd1938, 32; | |
add.s32 %r6604, %r6604, 8; | |
setp.ne.s32 %p259, %r6604, 0; | |
@%p259 bra BB0_513; | |
ld.local.u32 %r6605, [%rd1+512]; | |
BB0_515: | |
ld.local.u32 %r6607, [%rd1]; | |
mov.u32 %r6606, -128; | |
setp.le.u32 %p260, %r6607, %r6605; | |
@%p260 bra BB0_519; | |
mov.u64 %rd1937, %rd1; | |
bra.uni BB0_517; | |
BB0_518: | |
ld.local.u32 %r6607, [%rd1937+64]; | |
add.s64 %rd1937, %rd1937, 64; | |
BB0_517: | |
mov.u32 %r1501, %r6607; | |
ld.local.u32 %r3530, [%rd1937+512]; | |
ld.local.u32 %r3531, [%rd1937+4]; | |
ld.local.u32 %r3532, [%rd1937+516]; | |
ld.local.u32 %r3533, [%rd1937+8]; | |
ld.local.u32 %r3534, [%rd1937+520]; | |
ld.local.u32 %r3535, [%rd1937+12]; | |
ld.local.u32 %r3536, [%rd1937+524]; | |
ld.local.u32 %r3537, [%rd1937+16]; | |
ld.local.u32 %r3538, [%rd1937+528]; | |
ld.local.u32 %r3539, [%rd1937+20]; | |
ld.local.u32 %r3540, [%rd1937+532]; | |
ld.local.u32 %r3541, [%rd1937+24]; | |
ld.local.u32 %r3542, [%rd1937+536]; | |
ld.local.u32 %r3543, [%rd1937+28]; | |
ld.local.u32 %r3544, [%rd1937+540]; | |
ld.local.u32 %r3545, [%rd1937+32]; | |
ld.local.u32 %r3546, [%rd1937+544]; | |
ld.local.u32 %r3547, [%rd1937+36]; | |
ld.local.u32 %r3548, [%rd1937+548]; | |
ld.local.u32 %r3549, [%rd1937+40]; | |
ld.local.u32 %r3550, [%rd1937+552]; | |
ld.local.u32 %r3551, [%rd1937+44]; | |
ld.local.u32 %r3552, [%rd1937+556]; | |
ld.local.u32 %r3553, [%rd1937+48]; | |
ld.local.u32 %r3554, [%rd1937+560]; | |
ld.local.u32 %r3555, [%rd1937+52]; | |
ld.local.u32 %r3556, [%rd1937+564]; | |
st.local.u32 [%rd1937], %r3530; | |
st.local.u32 [%rd1937+512], %r1501; | |
st.local.u32 [%rd1937+4], %r3532; | |
st.local.u32 [%rd1937+516], %r3531; | |
st.local.u32 [%rd1937+8], %r3534; | |
st.local.u32 [%rd1937+520], %r3533; | |
st.local.u32 [%rd1937+12], %r3536; | |
st.local.u32 [%rd1937+524], %r3535; | |
st.local.u32 [%rd1937+16], %r3538; | |
st.local.u32 [%rd1937+528], %r3537; | |
st.local.u32 [%rd1937+20], %r3540; | |
st.local.u32 [%rd1937+532], %r3539; | |
st.local.u32 [%rd1937+24], %r3542; | |
st.local.u32 [%rd1937+536], %r3541; | |
st.local.u32 [%rd1937+28], %r3544; | |
st.local.u32 [%rd1937+540], %r3543; | |
st.local.u32 [%rd1937+32], %r3546; | |
st.local.u32 [%rd1937+544], %r3545; | |
st.local.u32 [%rd1937+36], %r3548; | |
st.local.u32 [%rd1937+548], %r3547; | |
st.local.u32 [%rd1937+40], %r3550; | |
st.local.u32 [%rd1937+552], %r3549; | |
st.local.u32 [%rd1937+44], %r3552; | |
st.local.u32 [%rd1937+556], %r3551; | |
st.local.u32 [%rd1937+48], %r3554; | |
st.local.u32 [%rd1937+560], %r3553; | |
st.local.u32 [%rd1937+52], %r3556; | |
st.local.u32 [%rd1937+564], %r3555; | |
ld.local.u32 %r3557, [%rd1937+56]; | |
ld.local.u32 %r3558, [%rd1937+568]; | |
ld.local.u32 %r3559, [%rd1937+60]; | |
ld.local.u32 %r3560, [%rd1937+572]; | |
st.local.u32 [%rd1937+56], %r3558; | |
st.local.u32 [%rd1937+568], %r3557; | |
st.local.u32 [%rd1937+60], %r3560; | |
st.local.u32 [%rd1937+572], %r3559; | |
add.s32 %r6606, %r6606, 16; | |
setp.eq.s32 %p261, %r6606, 0; | |
@%p261 bra BB0_519; | |
bra.uni BB0_518; | |
BB0_519: | |
ret; | |
} | |
// .globl digitH | |
.entry digitH( | |
.param .u64 .ptr .global .align 8 digitH_param_0, | |
.param .u64 .ptr .global .align 4 digitH_param_1, | |
.param .u64 .ptr .global .align 4 digitH_param_2 | |
) | |
{ | |
.local .align 64 .b8 __local_depot1[384]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<7>; | |
.reg .b16 %rs<69>; | |
.reg .b32 %r<2738>; | |
.reg .b64 %rd<2059>; | |
mov.u64 %rd2058, __local_depot1; | |
cvta.local.u64 %SP, %rd2058; | |
ld.param.u64 %rd208, [digitH_param_1]; | |
ld.param.u64 %rd209, [digitH_param_2]; | |
add.u64 %rd210, %SP, 0; | |
cvta.to.local.u64 %rd1, %rd210; | |
mov.u32 %r10, %ctaid.x; | |
mov.u32 %r1, %ntid.x; | |
mov.b32 %r11, %envreg3; | |
mad.lo.s32 %r12, %r10, %r1, %r11; | |
mov.u32 %r13, %tid.x; | |
add.s32 %r2736, %r12, %r13; | |
setp.gt.u32 %p1, %r2736, 1048575; | |
@%p1 bra BB1_10; | |
add.u64 %rd211, %SP, 208; | |
cvta.to.local.u64 %rd212, %rd211; | |
cvt.s64.s32 %rd2057, %r2736; | |
ld.const.s8 %r14, [blake2b_sigma]; | |
mul.wide.s32 %rd213, %r14, 8; | |
add.s64 %rd3, %rd212, %rd213; | |
ld.const.s8 %r15, [blake2b_sigma+1]; | |
mul.wide.s32 %rd214, %r15, 8; | |
add.s64 %rd4, %rd212, %rd214; | |
ld.const.s8 %r16, [blake2b_sigma+2]; | |
mul.wide.s32 %rd215, %r16, 8; | |
add.s64 %rd5, %rd212, %rd215; | |
ld.const.s8 %r17, [blake2b_sigma+3]; | |
mul.wide.s32 %rd216, %r17, 8; | |
add.s64 %rd6, %rd212, %rd216; | |
ld.const.s8 %r18, [blake2b_sigma+4]; | |
mul.wide.s32 %rd217, %r18, 8; | |
add.s64 %rd7, %rd212, %rd217; | |
ld.const.s8 %r19, [blake2b_sigma+5]; | |
mul.wide.s32 %rd218, %r19, 8; | |
add.s64 %rd8, %rd212, %rd218; | |
ld.const.s8 %r20, [blake2b_sigma+6]; | |
mul.wide.s32 %rd219, %r20, 8; | |
add.s64 %rd9, %rd212, %rd219; | |
ld.const.s8 %r21, [blake2b_sigma+7]; | |
mul.wide.s32 %rd220, %r21, 8; | |
add.s64 %rd10, %rd212, %rd220; | |
ld.const.s8 %r22, [blake2b_sigma+8]; | |
mul.wide.s32 %rd221, %r22, 8; | |
add.s64 %rd11, %rd212, %rd221; | |
ld.const.s8 %r23, [blake2b_sigma+9]; | |
mul.wide.s32 %rd222, %r23, 8; | |
add.s64 %rd12, %rd212, %rd222; | |
ld.const.s8 %r24, [blake2b_sigma+10]; | |
mul.wide.s32 %rd223, %r24, 8; | |
add.s64 %rd13, %rd212, %rd223; | |
ld.const.s8 %r25, [blake2b_sigma+11]; | |
mul.wide.s32 %rd224, %r25, 8; | |
add.s64 %rd14, %rd212, %rd224; | |
ld.const.s8 %r26, [blake2b_sigma+12]; | |
mul.wide.s32 %rd225, %r26, 8; | |
add.s64 %rd15, %rd212, %rd225; | |
ld.const.s8 %r27, [blake2b_sigma+13]; | |
mul.wide.s32 %rd226, %r27, 8; | |
add.s64 %rd16, %rd212, %rd226; | |
ld.const.s8 %r28, [blake2b_sigma+14]; | |
mul.wide.s32 %rd227, %r28, 8; | |
add.s64 %rd17, %rd212, %rd227; | |
ld.const.s8 %r29, [blake2b_sigma+15]; | |
mul.wide.s32 %rd228, %r29, 8; | |
add.s64 %rd18, %rd212, %rd228; | |
ld.const.s8 %r30, [blake2b_sigma+16]; | |
mul.wide.s32 %rd229, %r30, 8; | |
add.s64 %rd19, %rd212, %rd229; | |
ld.const.s8 %r31, [blake2b_sigma+17]; | |
mul.wide.s32 %rd230, %r31, 8; | |
add.s64 %rd20, %rd212, %rd230; | |
ld.const.s8 %r32, [blake2b_sigma+18]; | |
mul.wide.s32 %rd231, %r32, 8; | |
add.s64 %rd21, %rd212, %rd231; | |
ld.const.s8 %r33, [blake2b_sigma+19]; | |
mul.wide.s32 %rd232, %r33, 8; | |
add.s64 %rd22, %rd212, %rd232; | |
ld.const.s8 %r34, [blake2b_sigma+20]; | |
mul.wide.s32 %rd233, %r34, 8; | |
add.s64 %rd23, %rd212, %rd233; | |
ld.const.s8 %r35, [blake2b_sigma+21]; | |
mul.wide.s32 %rd234, %r35, 8; | |
add.s64 %rd24, %rd212, %rd234; | |
ld.const.s8 %r36, [blake2b_sigma+22]; | |
mul.wide.s32 %rd235, %r36, 8; | |
add.s64 %rd25, %rd212, %rd235; | |
ld.const.s8 %r37, [blake2b_sigma+23]; | |
mul.wide.s32 %rd236, %r37, 8; | |
add.s64 %rd26, %rd212, %rd236; | |
ld.const.s8 %r38, [blake2b_sigma+24]; | |
mul.wide.s32 %rd237, %r38, 8; | |
add.s64 %rd27, %rd212, %rd237; | |
ld.const.s8 %r39, [blake2b_sigma+25]; | |
mul.wide.s32 %rd238, %r39, 8; | |
add.s64 %rd28, %rd212, %rd238; | |
ld.const.s8 %r40, [blake2b_sigma+26]; | |
mul.wide.s32 %rd239, %r40, 8; | |
add.s64 %rd29, %rd212, %rd239; | |
ld.const.s8 %r41, [blake2b_sigma+27]; | |
mul.wide.s32 %rd240, %r41, 8; | |
add.s64 %rd30, %rd212, %rd240; | |
ld.const.s8 %r42, [blake2b_sigma+28]; | |
mul.wide.s32 %rd241, %r42, 8; | |
add.s64 %rd31, %rd212, %rd241; | |
ld.const.s8 %r43, [blake2b_sigma+29]; | |
mul.wide.s32 %rd242, %r43, 8; | |
add.s64 %rd32, %rd212, %rd242; | |
ld.const.s8 %r44, [blake2b_sigma+30]; | |
mul.wide.s32 %rd243, %r44, 8; | |
add.s64 %rd33, %rd212, %rd243; | |
ld.const.s8 %r45, [blake2b_sigma+31]; | |
mul.wide.s32 %rd244, %r45, 8; | |
add.s64 %rd34, %rd212, %rd244; | |
ld.const.s8 %r46, [blake2b_sigma+32]; | |
mul.wide.s32 %rd245, %r46, 8; | |
add.s64 %rd35, %rd212, %rd245; | |
ld.const.s8 %r47, [blake2b_sigma+33]; | |
mul.wide.s32 %rd246, %r47, 8; | |
add.s64 %rd36, %rd212, %rd246; | |
ld.const.s8 %r48, [blake2b_sigma+34]; | |
mul.wide.s32 %rd247, %r48, 8; | |
add.s64 %rd37, %rd212, %rd247; | |
ld.const.s8 %r49, [blake2b_sigma+35]; | |
mul.wide.s32 %rd248, %r49, 8; | |
add.s64 %rd38, %rd212, %rd248; | |
ld.const.s8 %r50, [blake2b_sigma+36]; | |
mul.wide.s32 %rd249, %r50, 8; | |
add.s64 %rd39, %rd212, %rd249; | |
ld.const.s8 %r51, [blake2b_sigma+37]; | |
mul.wide.s32 %rd250, %r51, 8; | |
add.s64 %rd40, %rd212, %rd250; | |
ld.const.s8 %r52, [blake2b_sigma+38]; | |
mul.wide.s32 %rd251, %r52, 8; | |
add.s64 %rd41, %rd212, %rd251; | |
ld.const.s8 %r53, [blake2b_sigma+39]; | |
mul.wide.s32 %rd252, %r53, 8; | |
add.s64 %rd42, %rd212, %rd252; | |
ld.const.s8 %r54, [blake2b_sigma+40]; | |
mul.wide.s32 %rd253, %r54, 8; | |
add.s64 %rd43, %rd212, %rd253; | |
ld.const.s8 %r55, [blake2b_sigma+41]; | |
mul.wide.s32 %rd254, %r55, 8; | |
add.s64 %rd44, %rd212, %rd254; | |
ld.const.s8 %r56, [blake2b_sigma+42]; | |
mul.wide.s32 %rd255, %r56, 8; | |
add.s64 %rd45, %rd212, %rd255; | |
ld.const.s8 %r57, [blake2b_sigma+43]; | |
mul.wide.s32 %rd256, %r57, 8; | |
add.s64 %rd46, %rd212, %rd256; | |
ld.const.s8 %r58, [blake2b_sigma+44]; | |
mul.wide.s32 %rd257, %r58, 8; | |
add.s64 %rd47, %rd212, %rd257; | |
ld.const.s8 %r59, [blake2b_sigma+45]; | |
mul.wide.s32 %rd258, %r59, 8; | |
add.s64 %rd48, %rd212, %rd258; | |
ld.const.s8 %r60, [blake2b_sigma+46]; | |
mul.wide.s32 %rd259, %r60, 8; | |
add.s64 %rd49, %rd212, %rd259; | |
ld.const.s8 %r61, [blake2b_sigma+47]; | |
mul.wide.s32 %rd260, %r61, 8; | |
add.s64 %rd50, %rd212, %rd260; | |
ld.const.s8 %r62, [blake2b_sigma+48]; | |
mul.wide.s32 %rd261, %r62, 8; | |
add.s64 %rd51, %rd212, %rd261; | |
ld.const.s8 %r63, [blake2b_sigma+49]; | |
mul.wide.s32 %rd262, %r63, 8; | |
add.s64 %rd52, %rd212, %rd262; | |
ld.const.s8 %r64, [blake2b_sigma+50]; | |
mul.wide.s32 %rd263, %r64, 8; | |
add.s64 %rd53, %rd212, %rd263; | |
ld.const.s8 %r65, [blake2b_sigma+51]; | |
mul.wide.s32 %rd264, %r65, 8; | |
add.s64 %rd54, %rd212, %rd264; | |
ld.const.s8 %r66, [blake2b_sigma+52]; | |
mul.wide.s32 %rd265, %r66, 8; | |
add.s64 %rd55, %rd212, %rd265; | |
ld.const.s8 %r67, [blake2b_sigma+53]; | |
mul.wide.s32 %rd266, %r67, 8; | |
add.s64 %rd56, %rd212, %rd266; | |
ld.const.s8 %r68, [blake2b_sigma+54]; | |
mul.wide.s32 %rd267, %r68, 8; | |
add.s64 %rd57, %rd212, %rd267; | |
ld.const.s8 %r69, [blake2b_sigma+55]; | |
mul.wide.s32 %rd268, %r69, 8; | |
add.s64 %rd58, %rd212, %rd268; | |
ld.const.s8 %r70, [blake2b_sigma+56]; | |
mul.wide.s32 %rd269, %r70, 8; | |
add.s64 %rd59, %rd212, %rd269; | |
ld.const.s8 %r71, [blake2b_sigma+57]; | |
mul.wide.s32 %rd270, %r71, 8; | |
add.s64 %rd60, %rd212, %rd270; | |
ld.const.s8 %r72, [blake2b_sigma+58]; | |
mul.wide.s32 %rd271, %r72, 8; | |
add.s64 %rd61, %rd212, %rd271; | |
ld.const.s8 %r73, [blake2b_sigma+59]; | |
mul.wide.s32 %rd272, %r73, 8; | |
add.s64 %rd62, %rd212, %rd272; | |
ld.const.s8 %r74, [blake2b_sigma+60]; | |
mul.wide.s32 %rd273, %r74, 8; | |
add.s64 %rd63, %rd212, %rd273; | |
ld.const.s8 %r75, [blake2b_sigma+61]; | |
mul.wide.s32 %rd274, %r75, 8; | |
add.s64 %rd64, %rd212, %rd274; | |
ld.const.s8 %r76, [blake2b_sigma+62]; | |
mul.wide.s32 %rd275, %r76, 8; | |
add.s64 %rd65, %rd212, %rd275; | |
ld.const.s8 %r77, [blake2b_sigma+63]; | |
mul.wide.s32 %rd276, %r77, 8; | |
add.s64 %rd66, %rd212, %rd276; | |
ld.const.s8 %r78, [blake2b_sigma+64]; | |
mul.wide.s32 %rd277, %r78, 8; | |
add.s64 %rd67, %rd212, %rd277; | |
ld.const.s8 %r79, [blake2b_sigma+65]; | |
mul.wide.s32 %rd278, %r79, 8; | |
add.s64 %rd68, %rd212, %rd278; | |
ld.const.s8 %r80, [blake2b_sigma+66]; | |
mul.wide.s32 %rd279, %r80, 8; | |
add.s64 %rd69, %rd212, %rd279; | |
ld.const.s8 %r81, [blake2b_sigma+67]; | |
mul.wide.s32 %rd280, %r81, 8; | |
add.s64 %rd70, %rd212, %rd280; | |
ld.const.s8 %r82, [blake2b_sigma+68]; | |
mul.wide.s32 %rd281, %r82, 8; | |
add.s64 %rd71, %rd212, %rd281; | |
ld.const.s8 %r83, [blake2b_sigma+69]; | |
mul.wide.s32 %rd282, %r83, 8; | |
add.s64 %rd72, %rd212, %rd282; | |
ld.const.s8 %r84, [blake2b_sigma+70]; | |
mul.wide.s32 %rd283, %r84, 8; | |
add.s64 %rd73, %rd212, %rd283; | |
ld.const.s8 %r85, [blake2b_sigma+71]; | |
mul.wide.s32 %rd284, %r85, 8; | |
add.s64 %rd74, %rd212, %rd284; | |
ld.const.s8 %r86, [blake2b_sigma+72]; | |
mul.wide.s32 %rd285, %r86, 8; | |
add.s64 %rd75, %rd212, %rd285; | |
ld.const.s8 %r87, [blake2b_sigma+73]; | |
mul.wide.s32 %rd286, %r87, 8; | |
add.s64 %rd76, %rd212, %rd286; | |
ld.const.s8 %r88, [blake2b_sigma+74]; | |
mul.wide.s32 %rd287, %r88, 8; | |
add.s64 %rd77, %rd212, %rd287; | |
ld.const.s8 %r89, [blake2b_sigma+75]; | |
mul.wide.s32 %rd288, %r89, 8; | |
add.s64 %rd78, %rd212, %rd288; | |
ld.const.s8 %r90, [blake2b_sigma+76]; | |
mul.wide.s32 %rd289, %r90, 8; | |
add.s64 %rd79, %rd212, %rd289; | |
ld.const.s8 %r91, [blake2b_sigma+77]; | |
mul.wide.s32 %rd290, %r91, 8; | |
add.s64 %rd80, %rd212, %rd290; | |
ld.const.s8 %r92, [blake2b_sigma+78]; | |
mul.wide.s32 %rd291, %r92, 8; | |
add.s64 %rd81, %rd212, %rd291; | |
ld.const.s8 %r93, [blake2b_sigma+79]; | |
mul.wide.s32 %rd292, %r93, 8; | |
add.s64 %rd82, %rd212, %rd292; | |
ld.const.s8 %r94, [blake2b_sigma+80]; | |
mul.wide.s32 %rd293, %r94, 8; | |
add.s64 %rd83, %rd212, %rd293; | |
ld.const.s8 %r95, [blake2b_sigma+81]; | |
mul.wide.s32 %rd294, %r95, 8; | |
add.s64 %rd84, %rd212, %rd294; | |
ld.const.s8 %r96, [blake2b_sigma+82]; | |
mul.wide.s32 %rd295, %r96, 8; | |
add.s64 %rd85, %rd212, %rd295; | |
ld.const.s8 %r97, [blake2b_sigma+83]; | |
mul.wide.s32 %rd296, %r97, 8; | |
add.s64 %rd86, %rd212, %rd296; | |
ld.const.s8 %r98, [blake2b_sigma+84]; | |
mul.wide.s32 %rd297, %r98, 8; | |
add.s64 %rd87, %rd212, %rd297; | |
ld.const.s8 %r99, [blake2b_sigma+85]; | |
mul.wide.s32 %rd298, %r99, 8; | |
add.s64 %rd88, %rd212, %rd298; | |
ld.const.s8 %r100, [blake2b_sigma+86]; | |
mul.wide.s32 %rd299, %r100, 8; | |
add.s64 %rd89, %rd212, %rd299; | |
ld.const.s8 %r101, [blake2b_sigma+87]; | |
mul.wide.s32 %rd300, %r101, 8; | |
add.s64 %rd90, %rd212, %rd300; | |
ld.const.s8 %r102, [blake2b_sigma+88]; | |
mul.wide.s32 %rd301, %r102, 8; | |
add.s64 %rd91, %rd212, %rd301; | |
ld.const.s8 %r103, [blake2b_sigma+89]; | |
mul.wide.s32 %rd302, %r103, 8; | |
add.s64 %rd92, %rd212, %rd302; | |
ld.const.s8 %r104, [blake2b_sigma+90]; | |
mul.wide.s32 %rd303, %r104, 8; | |
add.s64 %rd93, %rd212, %rd303; | |
ld.const.s8 %r105, [blake2b_sigma+91]; | |
mul.wide.s32 %rd304, %r105, 8; | |
add.s64 %rd94, %rd212, %rd304; | |
ld.const.s8 %r106, [blake2b_sigma+92]; | |
mul.wide.s32 %rd305, %r106, 8; | |
add.s64 %rd95, %rd212, %rd305; | |
ld.const.s8 %r107, [blake2b_sigma+93]; | |
mul.wide.s32 %rd306, %r107, 8; | |
add.s64 %rd96, %rd212, %rd306; | |
ld.const.s8 %r108, [blake2b_sigma+94]; | |
mul.wide.s32 %rd307, %r108, 8; | |
add.s64 %rd97, %rd212, %rd307; | |
ld.const.s8 %r109, [blake2b_sigma+95]; | |
mul.wide.s32 %rd308, %r109, 8; | |
add.s64 %rd98, %rd212, %rd308; | |
ld.const.s8 %r110, [blake2b_sigma+96]; | |
mul.wide.s32 %rd309, %r110, 8; | |
add.s64 %rd99, %rd212, %rd309; | |
ld.const.s8 %r111, [blake2b_sigma+97]; | |
mul.wide.s32 %rd310, %r111, 8; | |
add.s64 %rd100, %rd212, %rd310; | |
ld.const.s8 %r112, [blake2b_sigma+98]; | |
mul.wide.s32 %rd311, %r112, 8; | |
add.s64 %rd101, %rd212, %rd311; | |
ld.const.s8 %r113, [blake2b_sigma+99]; | |
mul.wide.s32 %rd312, %r113, 8; | |
add.s64 %rd102, %rd212, %rd312; | |
ld.const.s8 %r114, [blake2b_sigma+100]; | |
mul.wide.s32 %rd313, %r114, 8; | |
add.s64 %rd103, %rd212, %rd313; | |
ld.const.s8 %r115, [blake2b_sigma+101]; | |
mul.wide.s32 %rd314, %r115, 8; | |
add.s64 %rd104, %rd212, %rd314; | |
ld.const.s8 %r116, [blake2b_sigma+102]; | |
mul.wide.s32 %rd315, %r116, 8; | |
add.s64 %rd105, %rd212, %rd315; | |
ld.const.s8 %r117, [blake2b_sigma+103]; | |
mul.wide.s32 %rd316, %r117, 8; | |
add.s64 %rd106, %rd212, %rd316; | |
ld.const.s8 %r118, [blake2b_sigma+104]; | |
mul.wide.s32 %rd317, %r118, 8; | |
add.s64 %rd107, %rd212, %rd317; | |
ld.const.s8 %r119, [blake2b_sigma+105]; | |
mul.wide.s32 %rd318, %r119, 8; | |
add.s64 %rd108, %rd212, %rd318; | |
ld.const.s8 %r120, [blake2b_sigma+106]; | |
mul.wide.s32 %rd319, %r120, 8; | |
add.s64 %rd109, %rd212, %rd319; | |
ld.const.s8 %r121, [blake2b_sigma+107]; | |
mul.wide.s32 %rd320, %r121, 8; | |
add.s64 %rd110, %rd212, %rd320; | |
ld.const.s8 %r122, [blake2b_sigma+108]; | |
mul.wide.s32 %rd321, %r122, 8; | |
add.s64 %rd111, %rd212, %rd321; | |
ld.const.s8 %r123, [blake2b_sigma+109]; | |
mul.wide.s32 %rd322, %r123, 8; | |
add.s64 %rd112, %rd212, %rd322; | |
ld.const.s8 %r124, [blake2b_sigma+110]; | |
mul.wide.s32 %rd323, %r124, 8; | |
add.s64 %rd113, %rd212, %rd323; | |
ld.const.s8 %r125, [blake2b_sigma+111]; | |
mul.wide.s32 %rd324, %r125, 8; | |
add.s64 %rd114, %rd212, %rd324; | |
ld.const.s8 %r126, [blake2b_sigma+112]; | |
mul.wide.s32 %rd325, %r126, 8; | |
add.s64 %rd115, %rd212, %rd325; | |
ld.const.s8 %r127, [blake2b_sigma+113]; | |
mul.wide.s32 %rd326, %r127, 8; | |
add.s64 %rd116, %rd212, %rd326; | |
ld.const.s8 %r128, [blake2b_sigma+114]; | |
mul.wide.s32 %rd327, %r128, 8; | |
add.s64 %rd117, %rd212, %rd327; | |
ld.const.s8 %r129, [blake2b_sigma+115]; | |
mul.wide.s32 %rd328, %r129, 8; | |
add.s64 %rd118, %rd212, %rd328; | |
ld.const.s8 %r130, [blake2b_sigma+116]; | |
mul.wide.s32 %rd329, %r130, 8; | |
add.s64 %rd119, %rd212, %rd329; | |
ld.const.s8 %r131, [blake2b_sigma+117]; | |
mul.wide.s32 %rd330, %r131, 8; | |
add.s64 %rd120, %rd212, %rd330; | |
ld.const.s8 %r132, [blake2b_sigma+118]; | |
mul.wide.s32 %rd331, %r132, 8; | |
add.s64 %rd121, %rd212, %rd331; | |
ld.const.s8 %r133, [blake2b_sigma+119]; | |
mul.wide.s32 %rd332, %r133, 8; | |
add.s64 %rd122, %rd212, %rd332; | |
ld.const.s8 %r134, [blake2b_sigma+120]; | |
mul.wide.s32 %rd333, %r134, 8; | |
add.s64 %rd123, %rd212, %rd333; | |
ld.const.s8 %r135, [blake2b_sigma+121]; | |
mul.wide.s32 %rd334, %r135, 8; | |
add.s64 %rd124, %rd212, %rd334; | |
ld.const.s8 %r136, [blake2b_sigma+122]; | |
mul.wide.s32 %rd335, %r136, 8; | |
add.s64 %rd125, %rd212, %rd335; | |
ld.const.s8 %r137, [blake2b_sigma+123]; | |
mul.wide.s32 %rd336, %r137, 8; | |
add.s64 %rd126, %rd212, %rd336; | |
ld.const.s8 %r138, [blake2b_sigma+124]; | |
mul.wide.s32 %rd337, %r138, 8; | |
add.s64 %rd127, %rd212, %rd337; | |
ld.const.s8 %r139, [blake2b_sigma+125]; | |
mul.wide.s32 %rd338, %r139, 8; | |
add.s64 %rd128, %rd212, %rd338; | |
ld.const.s8 %r140, [blake2b_sigma+126]; | |
mul.wide.s32 %rd339, %r140, 8; | |
add.s64 %rd129, %rd212, %rd339; | |
ld.const.s8 %r141, [blake2b_sigma+127]; | |
mul.wide.s32 %rd340, %r141, 8; | |
add.s64 %rd130, %rd212, %rd340; | |
ld.const.s8 %r142, [blake2b_sigma+128]; | |
mul.wide.s32 %rd341, %r142, 8; | |
add.s64 %rd131, %rd212, %rd341; | |
ld.const.s8 %r143, [blake2b_sigma+129]; | |
mul.wide.s32 %rd342, %r143, 8; | |
add.s64 %rd132, %rd212, %rd342; | |
ld.const.s8 %r144, [blake2b_sigma+130]; | |
mul.wide.s32 %rd343, %r144, 8; | |
add.s64 %rd133, %rd212, %rd343; | |
ld.const.s8 %r145, [blake2b_sigma+131]; | |
mul.wide.s32 %rd344, %r145, 8; | |
add.s64 %rd134, %rd212, %rd344; | |
ld.const.s8 %r146, [blake2b_sigma+132]; | |
mul.wide.s32 %rd345, %r146, 8; | |
add.s64 %rd135, %rd212, %rd345; | |
ld.const.s8 %r147, [blake2b_sigma+133]; | |
mul.wide.s32 %rd346, %r147, 8; | |
add.s64 %rd136, %rd212, %rd346; | |
ld.const.s8 %r148, [blake2b_sigma+134]; | |
mul.wide.s32 %rd347, %r148, 8; | |
add.s64 %rd137, %rd212, %rd347; | |
ld.const.s8 %r149, [blake2b_sigma+135]; | |
mul.wide.s32 %rd348, %r149, 8; | |
add.s64 %rd138, %rd212, %rd348; | |
ld.const.s8 %r150, [blake2b_sigma+136]; | |
mul.wide.s32 %rd349, %r150, 8; | |
add.s64 %rd139, %rd212, %rd349; | |
ld.const.s8 %r151, [blake2b_sigma+137]; | |
mul.wide.s32 %rd350, %r151, 8; | |
add.s64 %rd140, %rd212, %rd350; | |
ld.const.s8 %r152, [blake2b_sigma+138]; | |
mul.wide.s32 %rd351, %r152, 8; | |
add.s64 %rd141, %rd212, %rd351; | |
ld.const.s8 %r153, [blake2b_sigma+139]; | |
mul.wide.s32 %rd352, %r153, 8; | |
add.s64 %rd142, %rd212, %rd352; | |
ld.const.s8 %r154, [blake2b_sigma+140]; | |
mul.wide.s32 %rd353, %r154, 8; | |
add.s64 %rd143, %rd212, %rd353; | |
ld.const.s8 %r155, [blake2b_sigma+141]; | |
mul.wide.s32 %rd354, %r155, 8; | |
add.s64 %rd144, %rd212, %rd354; | |
ld.const.s8 %r156, [blake2b_sigma+142]; | |
mul.wide.s32 %rd355, %r156, 8; | |
add.s64 %rd145, %rd212, %rd355; | |
ld.const.s8 %r157, [blake2b_sigma+143]; | |
mul.wide.s32 %rd356, %r157, 8; | |
add.s64 %rd146, %rd212, %rd356; | |
ld.const.s8 %r158, [blake2b_sigma+144]; | |
mul.wide.s32 %rd357, %r158, 8; | |
add.s64 %rd147, %rd212, %rd357; | |
ld.const.s8 %r159, [blake2b_sigma+145]; | |
mul.wide.s32 %rd358, %r159, 8; | |
add.s64 %rd148, %rd212, %rd358; | |
ld.const.s8 %r160, [blake2b_sigma+146]; | |
mul.wide.s32 %rd359, %r160, 8; | |
add.s64 %rd149, %rd212, %rd359; | |
ld.const.s8 %r161, [blake2b_sigma+147]; | |
mul.wide.s32 %rd360, %r161, 8; | |
add.s64 %rd150, %rd212, %rd360; | |
ld.const.s8 %r162, [blake2b_sigma+148]; | |
mul.wide.s32 %rd361, %r162, 8; | |
add.s64 %rd151, %rd212, %rd361; | |
ld.const.s8 %r163, [blake2b_sigma+149]; | |
mul.wide.s32 %rd362, %r163, 8; | |
add.s64 %rd152, %rd212, %rd362; | |
ld.const.s8 %r164, [blake2b_sigma+150]; | |
mul.wide.s32 %rd363, %r164, 8; | |
add.s64 %rd153, %rd212, %rd363; | |
ld.const.s8 %r165, [blake2b_sigma+151]; | |
mul.wide.s32 %rd364, %r165, 8; | |
add.s64 %rd154, %rd212, %rd364; | |
ld.const.s8 %r166, [blake2b_sigma+152]; | |
mul.wide.s32 %rd365, %r166, 8; | |
add.s64 %rd155, %rd212, %rd365; | |
ld.const.s8 %r167, [blake2b_sigma+153]; | |
mul.wide.s32 %rd366, %r167, 8; | |
add.s64 %rd156, %rd212, %rd366; | |
ld.const.s8 %r168, [blake2b_sigma+154]; | |
mul.wide.s32 %rd367, %r168, 8; | |
add.s64 %rd157, %rd212, %rd367; | |
ld.const.s8 %r169, [blake2b_sigma+155]; | |
mul.wide.s32 %rd368, %r169, 8; | |
add.s64 %rd158, %rd212, %rd368; | |
ld.const.s8 %r170, [blake2b_sigma+156]; | |
mul.wide.s32 %rd369, %r170, 8; | |
add.s64 %rd159, %rd212, %rd369; | |
ld.const.s8 %r171, [blake2b_sigma+157]; | |
mul.wide.s32 %rd370, %r171, 8; | |
add.s64 %rd160, %rd212, %rd370; | |
ld.const.s8 %r172, [blake2b_sigma+158]; | |
mul.wide.s32 %rd371, %r172, 8; | |
add.s64 %rd161, %rd212, %rd371; | |
ld.const.s8 %r173, [blake2b_sigma+159]; | |
mul.wide.s32 %rd372, %r173, 8; | |
add.s64 %rd162, %rd212, %rd372; | |
ld.const.s8 %r174, [blake2b_sigma+160]; | |
mul.wide.s32 %rd373, %r174, 8; | |
add.s64 %rd163, %rd212, %rd373; | |
ld.const.s8 %r175, [blake2b_sigma+161]; | |
mul.wide.s32 %rd374, %r175, 8; | |
add.s64 %rd164, %rd212, %rd374; | |
ld.const.s8 %r176, [blake2b_sigma+162]; | |
mul.wide.s32 %rd375, %r176, 8; | |
add.s64 %rd165, %rd212, %rd375; | |
ld.const.s8 %r177, [blake2b_sigma+163]; | |
mul.wide.s32 %rd376, %r177, 8; | |
add.s64 %rd166, %rd212, %rd376; | |
ld.const.s8 %r178, [blake2b_sigma+164]; | |
mul.wide.s32 %rd377, %r178, 8; | |
add.s64 %rd167, %rd212, %rd377; | |
ld.const.s8 %r179, [blake2b_sigma+165]; | |
mul.wide.s32 %rd378, %r179, 8; | |
add.s64 %rd168, %rd212, %rd378; | |
ld.const.s8 %r180, [blake2b_sigma+166]; | |
mul.wide.s32 %rd379, %r180, 8; | |
add.s64 %rd169, %rd212, %rd379; | |
ld.const.s8 %r181, [blake2b_sigma+167]; | |
mul.wide.s32 %rd380, %r181, 8; | |
add.s64 %rd170, %rd212, %rd380; | |
ld.const.s8 %r182, [blake2b_sigma+168]; | |
mul.wide.s32 %rd381, %r182, 8; | |
add.s64 %rd171, %rd212, %rd381; | |
ld.const.s8 %r183, [blake2b_sigma+169]; | |
mul.wide.s32 %rd382, %r183, 8; | |
add.s64 %rd172, %rd212, %rd382; | |
ld.const.s8 %r184, [blake2b_sigma+170]; | |
mul.wide.s32 %rd383, %r184, 8; | |
add.s64 %rd173, %rd212, %rd383; | |
ld.const.s8 %r185, [blake2b_sigma+171]; | |
mul.wide.s32 %rd384, %r185, 8; | |
add.s64 %rd174, %rd212, %rd384; | |
ld.const.s8 %r186, [blake2b_sigma+172]; | |
mul.wide.s32 %rd385, %r186, 8; | |
add.s64 %rd175, %rd212, %rd385; | |
ld.const.s8 %r187, [blake2b_sigma+173]; | |
mul.wide.s32 %rd386, %r187, 8; | |
add.s64 %rd176, %rd212, %rd386; | |
ld.const.s8 %r188, [blake2b_sigma+174]; | |
mul.wide.s32 %rd387, %r188, 8; | |
add.s64 %rd177, %rd212, %rd387; | |
ld.const.s8 %r189, [blake2b_sigma+175]; | |
mul.wide.s32 %rd388, %r189, 8; | |
add.s64 %rd178, %rd212, %rd388; | |
ld.const.s8 %r190, [blake2b_sigma+176]; | |
mul.wide.s32 %rd389, %r190, 8; | |
add.s64 %rd179, %rd212, %rd389; | |
ld.const.s8 %r191, [blake2b_sigma+177]; | |
mul.wide.s32 %rd390, %r191, 8; | |
add.s64 %rd180, %rd212, %rd390; | |
ld.const.s8 %r192, [blake2b_sigma+178]; | |
mul.wide.s32 %rd391, %r192, 8; | |
add.s64 %rd181, %rd212, %rd391; | |
ld.const.s8 %r193, [blake2b_sigma+179]; | |
mul.wide.s32 %rd392, %r193, 8; | |
add.s64 %rd182, %rd212, %rd392; | |
ld.const.s8 %r194, [blake2b_sigma+180]; | |
mul.wide.s32 %rd393, %r194, 8; | |
add.s64 %rd183, %rd212, %rd393; | |
ld.const.s8 %r195, [blake2b_sigma+181]; | |
mul.wide.s32 %rd394, %r195, 8; | |
add.s64 %rd184, %rd212, %rd394; | |
ld.const.s8 %r196, [blake2b_sigma+182]; | |
mul.wide.s32 %rd395, %r196, 8; | |
add.s64 %rd185, %rd212, %rd395; | |
ld.const.s8 %r197, [blake2b_sigma+183]; | |
mul.wide.s32 %rd396, %r197, 8; | |
add.s64 %rd186, %rd212, %rd396; | |
ld.const.s8 %r198, [blake2b_sigma+184]; | |
mul.wide.s32 %rd397, %r198, 8; | |
add.s64 %rd187, %rd212, %rd397; | |
ld.const.s8 %r199, [blake2b_sigma+185]; | |
mul.wide.s32 %rd398, %r199, 8; | |
add.s64 %rd188, %rd212, %rd398; | |
ld.const.s8 %r200, [blake2b_sigma+186]; | |
mul.wide.s32 %rd399, %r200, 8; | |
add.s64 %rd189, %rd212, %rd399; | |
ld.const.s8 %r201, [blake2b_sigma+187]; | |
mul.wide.s32 %rd400, %r201, 8; | |
add.s64 %rd190, %rd212, %rd400; | |
ld.const.s8 %r202, [blake2b_sigma+188]; | |
mul.wide.s32 %rd401, %r202, 8; | |
add.s64 %rd191, %rd212, %rd401; | |
ld.const.s8 %r203, [blake2b_sigma+189]; | |
mul.wide.s32 %rd402, %r203, 8; | |
add.s64 %rd192, %rd212, %rd402; | |
ld.const.s8 %r204, [blake2b_sigma+190]; | |
mul.wide.s32 %rd403, %r204, 8; | |
add.s64 %rd193, %rd212, %rd403; | |
ld.const.s8 %r205, [blake2b_sigma+191]; | |
mul.wide.s32 %rd404, %r205, 8; | |
add.s64 %rd194, %rd212, %rd404; | |
mov.b32 %r206, %envreg6; | |
mul.lo.s32 %r207, %r1, %r206; | |
cvt.s64.s32 %rd195, %r207; | |
BB1_2: | |
ld.param.u64 %rd2053, [digitH_param_0]; | |
ld.global.v2.u64 {%rd407, %rd408}, [%rd2053]; | |
ld.global.v2.u64 {%rd411, %rd412}, [%rd2053+16]; | |
ld.global.v2.u64 {%rd415, %rd416}, [%rd2053+32]; | |
ld.global.v2.u64 {%rd419, %rd420}, [%rd2053+48]; | |
st.local.v2.u64 [%rd1+48], {%rd419, %rd420}; | |
st.local.v2.u64 [%rd1+32], {%rd415, %rd416}; | |
st.local.v2.u64 [%rd1+16], {%rd411, %rd412}; | |
st.local.v2.u64 [%rd1], {%rd407, %rd408}; | |
ld.global.v2.u64 {%rd423, %rd424}, [%rd2053+64]; | |
ld.global.v2.u64 {%rd427, %rd428}, [%rd2053+80]; | |
ld.global.v2.u64 {%rd431, %rd432}, [%rd2053+96]; | |
ld.global.v2.u64 {%rd435, %rd436}, [%rd2053+112]; | |
add.s64 %rd439, %rd1, 64; | |
st.local.v2.u64 [%rd1+112], {%rd435, %rd436}; | |
st.local.v2.u64 [%rd1+96], {%rd431, %rd432}; | |
st.local.v2.u64 [%rd1+80], {%rd427, %rd428}; | |
st.local.v2.u64 [%rd1+64], {%rd423, %rd424}; | |
ld.global.v2.u64 {%rd440, %rd441}, [%rd2053+128]; | |
ld.global.v2.u64 {%rd444, %rd445}, [%rd2053+144]; | |
ld.global.v2.u64 {%rd448, %rd449}, [%rd2053+160]; | |
ld.global.v2.u64 {%rd452, %rd453}, [%rd2053+176]; | |
st.local.v2.u64 [%rd1+176], {%rd452, %rd453}; | |
st.local.v2.u64 [%rd1+160], {%rd448, %rd449}; | |
st.local.v2.u64 [%rd1+144], {%rd444, %rd445}; | |
st.local.v2.u64 [%rd1+128], {%rd440, %rd441}; | |
ld.global.v4.u8 {%rs49, %rs50, %rs51, %rs52}, [%rd2053+192]; | |
st.local.v4.u8 [%rd1+192], {%rs49, %rs50, %rs51, %rs52}; | |
ld.global.u8 %rd456, [%rd2053+194]; | |
add.s64 %rd457, %rd439, %rd456; | |
st.local.u32 [%rd457], %r2736; | |
ld.local.u8 %r209, [%rd1+194]; | |
add.s32 %r210, %r209, 4; | |
cvt.u16.u32 %rs67, %r210; | |
and.b16 %rs57, %rs67, 255; | |
st.local.u8 [%rd1+194], %rs67; | |
and.b32 %r211, %r210, 255; | |
ld.local.u16 %r212, [%rd1+192]; | |
add.s32 %r213, %r211, %r212; | |
cvt.u16.u32 %rs68, %r213; | |
st.local.u16 [%rd1+192], %rs68; | |
setp.eq.s16 %p2, %rs57, 128; | |
mov.u32 %r2737, 0; | |
@%p2 bra BB1_5; | |
BB1_3: | |
cvt.u32.u16 %r214, %rs67; | |
and.b32 %r215, %r214, 255; | |
add.s32 %r216, %r215, %r2737; | |
cvt.u64.u32 %rd458, %r216; | |
add.s64 %rd459, %rd1, %rd458; | |
mov.u16 %rs58, 0; | |
st.local.u8 [%rd459+64], %rs58; | |
ld.local.u8 %rs67, [%rd1+194]; | |
cvt.u32.u16 %r217, %rs67; | |
and.b32 %r218, %r217, 255; | |
mov.u32 %r219, 128; | |
sub.s32 %r220, %r219, %r218; | |
add.s32 %r2737, %r2737, 1; | |
setp.lt.u32 %p3, %r2737, %r220; | |
@%p3 bra BB1_3; | |
ld.local.u16 %rs68, [%rd1+192]; | |
BB1_5: | |
add.s64 %rd2056, %rd1, 1; | |
add.u64 %rd2055, %SP, 208; | |
cvta.to.local.u64 %rd2054, %rd2055; | |
ld.local.u64 %rd462, [%rd1+64]; | |
ld.local.u64 %rd463, [%rd1+72]; | |
ld.local.u64 %rd464, [%rd1+80]; | |
ld.local.u64 %rd465, [%rd1+88]; | |
ld.local.u64 %rd466, [%rd1+96]; | |
ld.local.u64 %rd467, [%rd1+104]; | |
ld.local.u64 %rd468, [%rd1+112]; | |
ld.local.u64 %rd469, [%rd1+120]; | |
ld.local.u64 %rd470, [%rd1+128]; | |
ld.local.u64 %rd471, [%rd1+136]; | |
ld.local.u64 %rd472, [%rd1+144]; | |
ld.local.u64 %rd473, [%rd1+152]; | |
ld.local.u64 %rd474, [%rd1+160]; | |
ld.local.u64 %rd475, [%rd1+168]; | |
ld.local.u64 %rd476, [%rd1+176]; | |
ld.local.u64 %rd477, [%rd1+184]; | |
st.local.u64 [%rd2054], %rd462; | |
st.local.u64 [%rd2054+8], %rd463; | |
st.local.u64 [%rd2054+16], %rd464; | |
st.local.u64 [%rd2054+24], %rd465; | |
st.local.u64 [%rd2054+32], %rd466; | |
st.local.u64 [%rd2054+40], %rd467; | |
st.local.u64 [%rd2054+48], %rd468; | |
st.local.u64 [%rd2054+56], %rd469; | |
st.local.u64 [%rd2054+64], %rd470; | |
st.local.u64 [%rd2054+72], %rd471; | |
st.local.u64 [%rd2054+80], %rd472; | |
st.local.u64 [%rd2054+88], %rd473; | |
st.local.u64 [%rd2054+96], %rd474; | |
st.local.u64 [%rd2054+104], %rd475; | |
st.local.u64 [%rd2054+112], %rd476; | |
st.local.u64 [%rd2054+120], %rd477; | |
cvt.u64.u16 %rd478, %rs68; | |
ld.local.u64 %rd479, [%rd1+32]; | |
ld.local.u64 %rd480, [%rd1]; | |
add.s64 %rd481, %rd479, %rd480; | |
ld.local.u64 %rd482, [%rd3]; | |
add.s64 %rd483, %rd481, %rd482; | |
xor.b64 %rd484, %rd478, %rd483; | |
xor.b64 %rd485, %rd484, 5840696475078001361; | |
mov.b64 {%r221, %r222}, %rd485; | |
mov.b64 %rd486, {%r222, %r221}; | |
add.s64 %rd487, %rd486, 7640891576956012808; | |
xor.b64 %rd488, %rd487, %rd479; | |
mov.b64 {%r223, %r224}, %rd488; | |
shr.u32 %r225, %r224, 24; | |
shl.b32 %r226, %r223, 8; | |
shr.u32 %r227, %r223, 24; | |
shl.b32 %r228, %r224, 8; | |
or.b32 %r229, %r225, %r226; | |
or.b32 %r230, %r227, %r228; | |
mov.b64 %rd489, {%r230, %r229}; | |
ld.local.u64 %rd490, [%rd4]; | |
add.s64 %rd491, %rd490, %rd483; | |
add.s64 %rd492, %rd491, %rd489; | |
xor.b64 %rd493, %rd492, %rd486; | |
mov.b64 {%r231, %r232}, %rd493; | |
shr.u32 %r233, %r232, 16; | |
shl.b32 %r234, %r231, 16; | |
shr.u32 %r235, %r231, 16; | |
shl.b32 %r236, %r232, 16; | |
or.b32 %r237, %r233, %r234; | |
or.b32 %r238, %r235, %r236; | |
mov.b64 %rd494, {%r238, %r237}; | |
add.s64 %rd495, %rd494, %rd487; | |
xor.b64 %rd496, %rd495, %rd489; | |
mov.b64 {%r239, %r240}, %rd496; | |
shr.u32 %r241, %r239, 31; | |
shl.b32 %r242, %r240, 1; | |
shr.u32 %r243, %r240, 31; | |
shl.b32 %r244, %r239, 1; | |
or.b32 %r245, %r241, %r242; | |
or.b32 %r246, %r243, %r244; | |
mov.b64 %rd497, {%r246, %r245}; | |
ld.local.u64 %rd498, [%rd1+40]; | |
ld.local.u64 %rd499, [%rd1+8]; | |
add.s64 %rd500, %rd498, %rd499; | |
ld.local.u64 %rd501, [%rd5]; | |
add.s64 %rd502, %rd500, %rd501; | |
xor.b64 %rd503, %rd502, -7276294671716946913; | |
mov.b64 {%r247, %r248}, %rd503; | |
mov.b64 %rd504, {%r248, %r247}; | |
add.s64 %rd505, %rd504, -4942790177534073029; | |
xor.b64 %rd506, %rd505, %rd498; | |
mov.b64 {%r249, %r250}, %rd506; | |
shr.u32 %r251, %r250, 24; | |
shl.b32 %r252, %r249, 8; | |
shr.u32 %r253, %r249, 24; | |
shl.b32 %r254, %r250, 8; | |
or.b32 %r255, %r251, %r252; | |
or.b32 %r256, %r253, %r254; | |
mov.b64 %rd507, {%r256, %r255}; | |
ld.local.u64 %rd508, [%rd6]; | |
add.s64 %rd509, %rd508, %rd502; | |
add.s64 %rd510, %rd509, %rd507; | |
xor.b64 %rd511, %rd510, %rd504; | |
mov.b64 {%r257, %r258}, %rd511; | |
shr.u32 %r259, %r258, 16; | |
shl.b32 %r260, %r257, 16; | |
shr.u32 %r261, %r257, 16; | |
shl.b32 %r262, %r258, 16; | |
or.b32 %r263, %r259, %r260; | |
or.b32 %r264, %r261, %r262; | |
mov.b64 %rd512, {%r264, %r263}; | |
add.s64 %rd513, %rd512, %rd505; | |
xor.b64 %rd514, %rd513, %rd507; | |
mov.b64 {%r265, %r266}, %rd514; | |
shr.u32 %r267, %r265, 31; | |
shl.b32 %r268, %r266, 1; | |
shr.u32 %r269, %r266, 31; | |
shl.b32 %r270, %r265, 1; | |
or.b32 %r271, %r267, %r268; | |
or.b32 %r272, %r269, %r270; | |
mov.b64 %rd515, {%r272, %r271}; | |
ld.local.u64 %rd516, [%rd1+48]; | |
ld.local.u64 %rd517, [%rd1+16]; | |
add.s64 %rd518, %rd516, %rd517; | |
ld.local.u64 %rd519, [%rd7]; | |
add.s64 %rd520, %rd518, %rd519; | |
xor.b64 %rd521, %rd520, -2270897969802886508; | |
mov.b64 {%r273, %r274}, %rd521; | |
mov.b64 %rd522, {%r274, %r273}; | |
add.s64 %rd523, %rd522, 4354685564936845355; | |
xor.b64 %rd524, %rd523, %rd516; | |
mov.b64 {%r275, %r276}, %rd524; | |
shr.u32 %r277, %r276, 24; | |
shl.b32 %r278, %r275, 8; | |
shr.u32 %r279, %r275, 24; | |
shl.b32 %r280, %r276, 8; | |
or.b32 %r281, %r277, %r278; | |
or.b32 %r282, %r279, %r280; | |
mov.b64 %rd525, {%r282, %r281}; | |
ld.local.u64 %rd526, [%rd8]; | |
add.s64 %rd527, %rd526, %rd520; | |
add.s64 %rd528, %rd527, %rd525; | |
xor.b64 %rd529, %rd528, %rd522; | |
mov.b64 {%r283, %r284}, %rd529; | |
shr.u32 %r285, %r284, 16; | |
shl.b32 %r286, %r283, 16; | |
shr.u32 %r287, %r283, 16; | |
shl.b32 %r288, %r284, 16; | |
or.b32 %r289, %r285, %r286; | |
or.b32 %r290, %r287, %r288; | |
mov.b64 %rd530, {%r290, %r289}; | |
add.s64 %rd531, %rd530, %rd523; | |
xor.b64 %rd532, %rd531, %rd525; | |
mov.b64 {%r291, %r292}, %rd532; | |
shr.u32 %r293, %r291, 31; | |
shl.b32 %r294, %r292, 1; | |
shr.u32 %r295, %r292, 31; | |
shl.b32 %r296, %r291, 1; | |
or.b32 %r297, %r293, %r294; | |
or.b32 %r298, %r295, %r296; | |
mov.b64 %rd533, {%r298, %r297}; | |
ld.local.u64 %rd534, [%rd1+56]; | |
ld.local.u64 %rd535, [%rd1+24]; | |
add.s64 %rd536, %rd534, %rd535; | |
ld.local.u64 %rd537, [%rd9]; | |
add.s64 %rd538, %rd536, %rd537; | |
xor.b64 %rd539, %rd538, 6620516959819538809; | |
mov.b64 {%r299, %r300}, %rd539; | |
mov.b64 %rd540, {%r300, %r299}; | |
add.s64 %rd541, %rd540, -6534734903238641935; | |
xor.b64 %rd542, %rd541, %rd534; | |
mov.b64 {%r301, %r302}, %rd542; | |
shr.u32 %r303, %r302, 24; | |
shl.b32 %r304, %r301, 8; | |
shr.u32 %r305, %r301, 24; | |
shl.b32 %r306, %r302, 8; | |
or.b32 %r307, %r303, %r304; | |
or.b32 %r308, %r305, %r306; | |
mov.b64 %rd543, {%r308, %r307}; | |
ld.local.u64 %rd544, [%rd10]; | |
add.s64 %rd545, %rd544, %rd538; | |
add.s64 %rd546, %rd545, %rd543; | |
xor.b64 %rd547, %rd546, %rd540; | |
mov.b64 {%r309, %r310}, %rd547; | |
shr.u32 %r311, %r310, 16; | |
shl.b32 %r312, %r309, 16; | |
shr.u32 %r313, %r309, 16; | |
shl.b32 %r314, %r310, 16; | |
or.b32 %r315, %r311, %r312; | |
or.b32 %r316, %r313, %r314; | |
mov.b64 %rd548, {%r316, %r315}; | |
add.s64 %rd549, %rd548, %rd541; | |
xor.b64 %rd550, %rd549, %rd543; | |
mov.b64 {%r317, %r318}, %rd550; | |
shr.u32 %r319, %r317, 31; | |
shl.b32 %r320, %r318, 1; | |
shr.u32 %r321, %r318, 31; | |
shl.b32 %r322, %r317, 1; | |
or.b32 %r323, %r319, %r320; | |
or.b32 %r324, %r321, %r322; | |
mov.b64 %rd551, {%r324, %r323}; | |
ld.local.u64 %rd552, [%rd11]; | |
add.s64 %rd553, %rd552, %rd492; | |
add.s64 %rd554, %rd553, %rd515; | |
xor.b64 %rd555, %rd554, %rd548; | |
mov.b64 {%r325, %r326}, %rd555; | |
mov.b64 %rd556, {%r326, %r325}; | |
add.s64 %rd557, %rd556, %rd531; | |
xor.b64 %rd558, %rd557, %rd515; | |
mov.b64 {%r327, %r328}, %rd558; | |
shr.u32 %r329, %r328, 24; | |
shl.b32 %r330, %r327, 8; | |
shr.u32 %r331, %r327, 24; | |
shl.b32 %r332, %r328, 8; | |
or.b32 %r333, %r329, %r330; | |
or.b32 %r334, %r331, %r332; | |
mov.b64 %rd559, {%r334, %r333}; | |
ld.local.u64 %rd560, [%rd12]; | |
add.s64 %rd561, %rd554, %rd560; | |
add.s64 %rd562, %rd561, %rd559; | |
xor.b64 %rd563, %rd562, %rd556; | |
mov.b64 {%r335, %r336}, %rd563; | |
shr.u32 %r337, %r336, 16; | |
shl.b32 %r338, %r335, 16; | |
shr.u32 %r339, %r335, 16; | |
shl.b32 %r340, %r336, 16; | |
or.b32 %r341, %r337, %r338; | |
or.b32 %r342, %r339, %r340; | |
mov.b64 %rd564, {%r342, %r341}; | |
add.s64 %rd565, %rd564, %rd557; | |
xor.b64 %rd566, %rd565, %rd559; | |
mov.b64 {%r343, %r344}, %rd566; | |
shr.u32 %r345, %r343, 31; | |
shl.b32 %r346, %r344, 1; | |
shr.u32 %r347, %r344, 31; | |
shl.b32 %r348, %r343, 1; | |
or.b32 %r349, %r345, %r346; | |
or.b32 %r350, %r347, %r348; | |
mov.b64 %rd567, {%r350, %r349}; | |
ld.local.u64 %rd568, [%rd13]; | |
add.s64 %rd569, %rd568, %rd510; | |
add.s64 %rd570, %rd569, %rd533; | |
xor.b64 %rd571, %rd570, %rd494; | |
mov.b64 {%r351, %r352}, %rd571; | |
mov.b64 %rd572, {%r352, %r351}; | |
add.s64 %rd573, %rd572, %rd549; | |
xor.b64 %rd574, %rd573, %rd533; | |
mov.b64 {%r353, %r354}, %rd574; | |
shr.u32 %r355, %r354, 24; | |
shl.b32 %r356, %r353, 8; | |
shr.u32 %r357, %r353, 24; | |
shl.b32 %r358, %r354, 8; | |
or.b32 %r359, %r355, %r356; | |
or.b32 %r360, %r357, %r358; | |
mov.b64 %rd575, {%r360, %r359}; | |
ld.local.u64 %rd576, [%rd14]; | |
add.s64 %rd577, %rd570, %rd576; | |
add.s64 %rd578, %rd577, %rd575; | |
xor.b64 %rd579, %rd578, %rd572; | |
mov.b64 {%r361, %r362}, %rd579; | |
shr.u32 %r363, %r362, 16; | |
shl.b32 %r364, %r361, 16; | |
shr.u32 %r365, %r361, 16; | |
shl.b32 %r366, %r362, 16; | |
or.b32 %r367, %r363, %r364; | |
or.b32 %r368, %r365, %r366; | |
mov.b64 %rd580, {%r368, %r367}; | |
add.s64 %rd581, %rd580, %rd573; | |
xor.b64 %rd582, %rd581, %rd575; | |
mov.b64 {%r369, %r370}, %rd582; | |
shr.u32 %r371, %r369, 31; | |
shl.b32 %r372, %r370, 1; | |
shr.u32 %r373, %r370, 31; | |
shl.b32 %r374, %r369, 1; | |
or.b32 %r375, %r371, %r372; | |
or.b32 %r376, %r373, %r374; | |
mov.b64 %rd583, {%r376, %r375}; | |
ld.local.u64 %rd584, [%rd15]; | |
add.s64 %rd585, %rd584, %rd528; | |
add.s64 %rd586, %rd585, %rd551; | |
xor.b64 %rd587, %rd586, %rd512; | |
mov.b64 {%r377, %r378}, %rd587; | |
mov.b64 %rd588, {%r378, %r377}; | |
add.s64 %rd589, %rd588, %rd495; | |
xor.b64 %rd590, %rd589, %rd551; | |
mov.b64 {%r379, %r380}, %rd590; | |
shr.u32 %r381, %r380, 24; | |
shl.b32 %r382, %r379, 8; | |
shr.u32 %r383, %r379, 24; | |
shl.b32 %r384, %r380, 8; | |
or.b32 %r385, %r381, %r382; | |
or.b32 %r386, %r383, %r384; | |
mov.b64 %rd591, {%r386, %r385}; | |
ld.local.u64 %rd592, [%rd16]; | |
add.s64 %rd593, %rd586, %rd592; | |
add.s64 %rd594, %rd593, %rd591; | |
xor.b64 %rd595, %rd594, %rd588; | |
mov.b64 {%r387, %r388}, %rd595; | |
shr.u32 %r389, %r388, 16; | |
shl.b32 %r390, %r387, 16; | |
shr.u32 %r391, %r387, 16; | |
shl.b32 %r392, %r388, 16; | |
or.b32 %r393, %r389, %r390; | |
or.b32 %r394, %r391, %r392; | |
mov.b64 %rd596, {%r394, %r393}; | |
add.s64 %rd597, %rd596, %rd589; | |
xor.b64 %rd598, %rd597, %rd591; | |
mov.b64 {%r395, %r396}, %rd598; | |
shr.u32 %r397, %r395, 31; | |
shl.b32 %r398, %r396, 1; | |
shr.u32 %r399, %r396, 31; | |
shl.b32 %r400, %r395, 1; | |
or.b32 %r401, %r397, %r398; | |
or.b32 %r402, %r399, %r400; | |
mov.b64 %rd599, {%r402, %r401}; | |
ld.local.u64 %rd600, [%rd17]; | |
add.s64 %rd601, %rd600, %rd546; | |
add.s64 %rd602, %rd601, %rd497; | |
xor.b64 %rd603, %rd602, %rd530; | |
mov.b64 {%r403, %r404}, %rd603; | |
mov.b64 %rd604, {%r404, %r403}; | |
add.s64 %rd605, %rd604, %rd513; | |
xor.b64 %rd606, %rd605, %rd497; | |
mov.b64 {%r405, %r406}, %rd606; | |
shr.u32 %r407, %r406, 24; | |
shl.b32 %r408, %r405, 8; | |
shr.u32 %r409, %r405, 24; | |
shl.b32 %r410, %r406, 8; | |
or.b32 %r411, %r407, %r408; | |
or.b32 %r412, %r409, %r410; | |
mov.b64 %rd607, {%r412, %r411}; | |
ld.local.u64 %rd608, [%rd18]; | |
add.s64 %rd609, %rd602, %rd608; | |
add.s64 %rd610, %rd609, %rd607; | |
xor.b64 %rd611, %rd610, %rd604; | |
mov.b64 {%r413, %r414}, %rd611; | |
shr.u32 %r415, %r414, 16; | |
shl.b32 %r416, %r413, 16; | |
shr.u32 %r417, %r413, 16; | |
shl.b32 %r418, %r414, 16; | |
or.b32 %r419, %r415, %r416; | |
or.b32 %r420, %r417, %r418; | |
mov.b64 %rd612, {%r420, %r419}; | |
add.s64 %rd613, %rd612, %rd605; | |
xor.b64 %rd614, %rd613, %rd607; | |
mov.b64 {%r421, %r422}, %rd614; | |
shr.u32 %r423, %r421, 31; | |
shl.b32 %r424, %r422, 1; | |
shr.u32 %r425, %r422, 31; | |
shl.b32 %r426, %r421, 1; | |
or.b32 %r427, %r423, %r424; | |
or.b32 %r428, %r425, %r426; | |
mov.b64 %rd615, {%r428, %r427}; | |
ld.local.u64 %rd616, [%rd19]; | |
add.s64 %rd617, %rd562, %rd616; | |
add.s64 %rd618, %rd617, %rd615; | |
xor.b64 %rd619, %rd618, %rd580; | |
mov.b64 {%r429, %r430}, %rd619; | |
mov.b64 %rd620, {%r430, %r429}; | |
add.s64 %rd621, %rd620, %rd597; | |
xor.b64 %rd622, %rd621, %rd615; | |
mov.b64 {%r431, %r432}, %rd622; | |
shr.u32 %r433, %r432, 24; | |
shl.b32 %r434, %r431, 8; | |
shr.u32 %r435, %r431, 24; | |
shl.b32 %r436, %r432, 8; | |
or.b32 %r437, %r433, %r434; | |
or.b32 %r438, %r435, %r436; | |
mov.b64 %rd623, {%r438, %r437}; | |
ld.local.u64 %rd624, [%rd20]; | |
add.s64 %rd625, %rd618, %rd624; | |
add.s64 %rd626, %rd625, %rd623; | |
xor.b64 %rd627, %rd626, %rd620; | |
mov.b64 {%r439, %r440}, %rd627; | |
shr.u32 %r441, %r440, 16; | |
shl.b32 %r442, %r439, 16; | |
shr.u32 %r443, %r439, 16; | |
shl.b32 %r444, %r440, 16; | |
or.b32 %r445, %r441, %r442; | |
or.b32 %r446, %r443, %r444; | |
mov.b64 %rd628, {%r446, %r445}; | |
add.s64 %rd629, %rd628, %rd621; | |
xor.b64 %rd630, %rd629, %rd623; | |
mov.b64 {%r447, %r448}, %rd630; | |
shr.u32 %r449, %r447, 31; | |
shl.b32 %r450, %r448, 1; | |
shr.u32 %r451, %r448, 31; | |
shl.b32 %r452, %r447, 1; | |
or.b32 %r453, %r449, %r450; | |
or.b32 %r454, %r451, %r452; | |
mov.b64 %rd631, {%r454, %r453}; | |
ld.local.u64 %rd632, [%rd21]; | |
add.s64 %rd633, %rd578, %rd632; | |
add.s64 %rd634, %rd633, %rd567; | |
xor.b64 %rd635, %rd634, %rd596; | |
mov.b64 {%r455, %r456}, %rd635; | |
mov.b64 %rd636, {%r456, %r455}; | |
add.s64 %rd637, %rd636, %rd613; | |
xor.b64 %rd638, %rd637, %rd567; | |
mov.b64 {%r457, %r458}, %rd638; | |
shr.u32 %r459, %r458, 24; | |
shl.b32 %r460, %r457, 8; | |
shr.u32 %r461, %r457, 24; | |
shl.b32 %r462, %r458, 8; | |
or.b32 %r463, %r459, %r460; | |
or.b32 %r464, %r461, %r462; | |
mov.b64 %rd639, {%r464, %r463}; | |
ld.local.u64 %rd640, [%rd22]; | |
add.s64 %rd641, %rd634, %rd640; | |
add.s64 %rd642, %rd641, %rd639; | |
xor.b64 %rd643, %rd642, %rd636; | |
mov.b64 {%r465, %r466}, %rd643; | |
shr.u32 %r467, %r466, 16; | |
shl.b32 %r468, %r465, 16; | |
shr.u32 %r469, %r465, 16; | |
shl.b32 %r470, %r466, 16; | |
or.b32 %r471, %r467, %r468; | |
or.b32 %r472, %r469, %r470; | |
mov.b64 %rd644, {%r472, %r471}; | |
add.s64 %rd645, %rd644, %rd637; | |
xor.b64 %rd646, %rd645, %rd639; | |
mov.b64 {%r473, %r474}, %rd646; | |
shr.u32 %r475, %r473, 31; | |
shl.b32 %r476, %r474, 1; | |
shr.u32 %r477, %r474, 31; | |
shl.b32 %r478, %r473, 1; | |
or.b32 %r479, %r475, %r476; | |
or.b32 %r480, %r477, %r478; | |
mov.b64 %rd647, {%r480, %r479}; | |
ld.local.u64 %rd648, [%rd23]; | |
add.s64 %rd649, %rd594, %rd648; | |
add.s64 %rd650, %rd649, %rd583; | |
xor.b64 %rd651, %rd650, %rd612; | |
mov.b64 {%r481, %r482}, %rd651; | |
mov.b64 %rd652, {%r482, %r481}; | |
add.s64 %rd653, %rd652, %rd565; | |
xor.b64 %rd654, %rd653, %rd583; | |
mov.b64 {%r483, %r484}, %rd654; | |
shr.u32 %r485, %r484, 24; | |
shl.b32 %r486, %r483, 8; | |
shr.u32 %r487, %r483, 24; | |
shl.b32 %r488, %r484, 8; | |
or.b32 %r489, %r485, %r486; | |
or.b32 %r490, %r487, %r488; | |
mov.b64 %rd655, {%r490, %r489}; | |
ld.local.u64 %rd656, [%rd24]; | |
add.s64 %rd657, %rd650, %rd656; | |
add.s64 %rd658, %rd657, %rd655; | |
xor.b64 %rd659, %rd658, %rd652; | |
mov.b64 {%r491, %r492}, %rd659; | |
shr.u32 %r493, %r492, 16; | |
shl.b32 %r494, %r491, 16; | |
shr.u32 %r495, %r491, 16; | |
shl.b32 %r496, %r492, 16; | |
or.b32 %r497, %r493, %r494; | |
or.b32 %r498, %r495, %r496; | |
mov.b64 %rd660, {%r498, %r497}; | |
add.s64 %rd661, %rd660, %rd653; | |
xor.b64 %rd662, %rd661, %rd655; | |
mov.b64 {%r499, %r500}, %rd662; | |
shr.u32 %r501, %r499, 31; | |
shl.b32 %r502, %r500, 1; | |
shr.u32 %r503, %r500, 31; | |
shl.b32 %r504, %r499, 1; | |
or.b32 %r505, %r501, %r502; | |
or.b32 %r506, %r503, %r504; | |
mov.b64 %rd663, {%r506, %r505}; | |
ld.local.u64 %rd664, [%rd25]; | |
add.s64 %rd665, %rd610, %rd664; | |
add.s64 %rd666, %rd665, %rd599; | |
xor.b64 %rd667, %rd666, %rd564; | |
mov.b64 {%r507, %r508}, %rd667; | |
mov.b64 %rd668, {%r508, %r507}; | |
add.s64 %rd669, %rd668, %rd581; | |
xor.b64 %rd670, %rd669, %rd599; | |
mov.b64 {%r509, %r510}, %rd670; | |
shr.u32 %r511, %r510, 24; | |
shl.b32 %r512, %r509, 8; | |
shr.u32 %r513, %r509, 24; | |
shl.b32 %r514, %r510, 8; | |
or.b32 %r515, %r511, %r512; | |
or.b32 %r516, %r513, %r514; | |
mov.b64 %rd671, {%r516, %r515}; | |
ld.local.u64 %rd672, [%rd26]; | |
add.s64 %rd673, %rd666, %rd672; | |
add.s64 %rd674, %rd673, %rd671; | |
xor.b64 %rd675, %rd674, %rd668; | |
mov.b64 {%r517, %r518}, %rd675; | |
shr.u32 %r519, %r518, 16; | |
shl.b32 %r520, %r517, 16; | |
shr.u32 %r521, %r517, 16; | |
shl.b32 %r522, %r518, 16; | |
or.b32 %r523, %r519, %r520; | |
or.b32 %r524, %r521, %r522; | |
mov.b64 %rd676, {%r524, %r523}; | |
add.s64 %rd677, %rd676, %rd669; | |
xor.b64 %rd678, %rd677, %rd671; | |
mov.b64 {%r525, %r526}, %rd678; | |
shr.u32 %r527, %r525, 31; | |
shl.b32 %r528, %r526, 1; | |
shr.u32 %r529, %r526, 31; | |
shl.b32 %r530, %r525, 1; | |
or.b32 %r531, %r527, %r528; | |
or.b32 %r532, %r529, %r530; | |
mov.b64 %rd679, {%r532, %r531}; | |
ld.local.u64 %rd680, [%rd27]; | |
add.s64 %rd681, %rd626, %rd680; | |
add.s64 %rd682, %rd681, %rd647; | |
xor.b64 %rd683, %rd682, %rd676; | |
mov.b64 {%r533, %r534}, %rd683; | |
mov.b64 %rd684, {%r534, %r533}; | |
add.s64 %rd685, %rd684, %rd661; | |
xor.b64 %rd686, %rd685, %rd647; | |
mov.b64 {%r535, %r536}, %rd686; | |
shr.u32 %r537, %r536, 24; | |
shl.b32 %r538, %r535, 8; | |
shr.u32 %r539, %r535, 24; | |
shl.b32 %r540, %r536, 8; | |
or.b32 %r541, %r537, %r538; | |
or.b32 %r542, %r539, %r540; | |
mov.b64 %rd687, {%r542, %r541}; | |
ld.local.u64 %rd688, [%rd28]; | |
add.s64 %rd689, %rd682, %rd688; | |
add.s64 %rd690, %rd689, %rd687; | |
xor.b64 %rd691, %rd690, %rd684; | |
mov.b64 {%r543, %r544}, %rd691; | |
shr.u32 %r545, %r544, 16; | |
shl.b32 %r546, %r543, 16; | |
shr.u32 %r547, %r543, 16; | |
shl.b32 %r548, %r544, 16; | |
or.b32 %r549, %r545, %r546; | |
or.b32 %r550, %r547, %r548; | |
mov.b64 %rd692, {%r550, %r549}; | |
add.s64 %rd693, %rd692, %rd685; | |
xor.b64 %rd694, %rd693, %rd687; | |
mov.b64 {%r551, %r552}, %rd694; | |
shr.u32 %r553, %r551, 31; | |
shl.b32 %r554, %r552, 1; | |
shr.u32 %r555, %r552, 31; | |
shl.b32 %r556, %r551, 1; | |
or.b32 %r557, %r553, %r554; | |
or.b32 %r558, %r555, %r556; | |
mov.b64 %rd695, {%r558, %r557}; | |
ld.local.u64 %rd696, [%rd29]; | |
add.s64 %rd697, %rd642, %rd696; | |
add.s64 %rd698, %rd697, %rd663; | |
xor.b64 %rd699, %rd698, %rd628; | |
mov.b64 {%r559, %r560}, %rd699; | |
mov.b64 %rd700, {%r560, %r559}; | |
add.s64 %rd701, %rd700, %rd677; | |
xor.b64 %rd702, %rd701, %rd663; | |
mov.b64 {%r561, %r562}, %rd702; | |
shr.u32 %r563, %r562, 24; | |
shl.b32 %r564, %r561, 8; | |
shr.u32 %r565, %r561, 24; | |
shl.b32 %r566, %r562, 8; | |
or.b32 %r567, %r563, %r564; | |
or.b32 %r568, %r565, %r566; | |
mov.b64 %rd703, {%r568, %r567}; | |
ld.local.u64 %rd704, [%rd30]; | |
add.s64 %rd705, %rd698, %rd704; | |
add.s64 %rd706, %rd705, %rd703; | |
xor.b64 %rd707, %rd706, %rd700; | |
mov.b64 {%r569, %r570}, %rd707; | |
shr.u32 %r571, %r570, 16; | |
shl.b32 %r572, %r569, 16; | |
shr.u32 %r573, %r569, 16; | |
shl.b32 %r574, %r570, 16; | |
or.b32 %r575, %r571, %r572; | |
or.b32 %r576, %r573, %r574; | |
mov.b64 %rd708, {%r576, %r575}; | |
add.s64 %rd709, %rd708, %rd701; | |
xor.b64 %rd710, %rd709, %rd703; | |
mov.b64 {%r577, %r578}, %rd710; | |
shr.u32 %r579, %r577, 31; | |
shl.b32 %r580, %r578, 1; | |
shr.u32 %r581, %r578, 31; | |
shl.b32 %r582, %r577, 1; | |
or.b32 %r583, %r579, %r580; | |
or.b32 %r584, %r581, %r582; | |
mov.b64 %rd711, {%r584, %r583}; | |
ld.local.u64 %rd712, [%rd31]; | |
add.s64 %rd713, %rd658, %rd712; | |
add.s64 %rd714, %rd713, %rd679; | |
xor.b64 %rd715, %rd714, %rd644; | |
mov.b64 {%r585, %r586}, %rd715; | |
mov.b64 %rd716, {%r586, %r585}; | |
add.s64 %rd717, %rd716, %rd629; | |
xor.b64 %rd718, %rd717, %rd679; | |
mov.b64 {%r587, %r588}, %rd718; | |
shr.u32 %r589, %r588, 24; | |
shl.b32 %r590, %r587, 8; | |
shr.u32 %r591, %r587, 24; | |
shl.b32 %r592, %r588, 8; | |
or.b32 %r593, %r589, %r590; | |
or.b32 %r594, %r591, %r592; | |
mov.b64 %rd719, {%r594, %r593}; | |
ld.local.u64 %rd720, [%rd32]; | |
add.s64 %rd721, %rd714, %rd720; | |
add.s64 %rd722, %rd721, %rd719; | |
xor.b64 %rd723, %rd722, %rd716; | |
mov.b64 {%r595, %r596}, %rd723; | |
shr.u32 %r597, %r596, 16; | |
shl.b32 %r598, %r595, 16; | |
shr.u32 %r599, %r595, 16; | |
shl.b32 %r600, %r596, 16; | |
or.b32 %r601, %r597, %r598; | |
or.b32 %r602, %r599, %r600; | |
mov.b64 %rd724, {%r602, %r601}; | |
add.s64 %rd725, %rd724, %rd717; | |
xor.b64 %rd726, %rd725, %rd719; | |
mov.b64 {%r603, %r604}, %rd726; | |
shr.u32 %r605, %r603, 31; | |
shl.b32 %r606, %r604, 1; | |
shr.u32 %r607, %r604, 31; | |
shl.b32 %r608, %r603, 1; | |
or.b32 %r609, %r605, %r606; | |
or.b32 %r610, %r607, %r608; | |
mov.b64 %rd727, {%r610, %r609}; | |
ld.local.u64 %rd728, [%rd33]; | |
add.s64 %rd729, %rd674, %rd728; | |
add.s64 %rd730, %rd729, %rd631; | |
xor.b64 %rd731, %rd730, %rd660; | |
mov.b64 {%r611, %r612}, %rd731; | |
mov.b64 %rd732, {%r612, %r611}; | |
add.s64 %rd733, %rd732, %rd645; | |
xor.b64 %rd734, %rd733, %rd631; | |
mov.b64 {%r613, %r614}, %rd734; | |
shr.u32 %r615, %r614, 24; | |
shl.b32 %r616, %r613, 8; | |
shr.u32 %r617, %r613, 24; | |
shl.b32 %r618, %r614, 8; | |
or.b32 %r619, %r615, %r616; | |
or.b32 %r620, %r617, %r618; | |
mov.b64 %rd735, {%r620, %r619}; | |
ld.local.u64 %rd736, [%rd34]; | |
add.s64 %rd737, %rd730, %rd736; | |
add.s64 %rd738, %rd737, %rd735; | |
xor.b64 %rd739, %rd738, %rd732; | |
mov.b64 {%r621, %r622}, %rd739; | |
shr.u32 %r623, %r622, 16; | |
shl.b32 %r624, %r621, 16; | |
shr.u32 %r625, %r621, 16; | |
shl.b32 %r626, %r622, 16; | |
or.b32 %r627, %r623, %r624; | |
or.b32 %r628, %r625, %r626; | |
mov.b64 %rd740, {%r628, %r627}; | |
add.s64 %rd741, %rd740, %rd733; | |
xor.b64 %rd742, %rd741, %rd735; | |
mov.b64 {%r629, %r630}, %rd742; | |
shr.u32 %r631, %r629, 31; | |
shl.b32 %r632, %r630, 1; | |
shr.u32 %r633, %r630, 31; | |
shl.b32 %r634, %r629, 1; | |
or.b32 %r635, %r631, %r632; | |
or.b32 %r636, %r633, %r634; | |
mov.b64 %rd743, {%r636, %r635}; | |
ld.local.u64 %rd744, [%rd35]; | |
add.s64 %rd745, %rd690, %rd744; | |
add.s64 %rd746, %rd745, %rd743; | |
xor.b64 %rd747, %rd746, %rd708; | |
mov.b64 {%r637, %r638}, %rd747; | |
mov.b64 %rd748, {%r638, %r637}; | |
add.s64 %rd749, %rd748, %rd725; | |
xor.b64 %rd750, %rd749, %rd743; | |
mov.b64 {%r639, %r640}, %rd750; | |
shr.u32 %r641, %r640, 24; | |
shl.b32 %r642, %r639, 8; | |
shr.u32 %r643, %r639, 24; | |
shl.b32 %r644, %r640, 8; | |
or.b32 %r645, %r641, %r642; | |
or.b32 %r646, %r643, %r644; | |
mov.b64 %rd751, {%r646, %r645}; | |
ld.local.u64 %rd752, [%rd36]; | |
add.s64 %rd753, %rd746, %rd752; | |
add.s64 %rd754, %rd753, %rd751; | |
xor.b64 %rd755, %rd754, %rd748; | |
mov.b64 {%r647, %r648}, %rd755; | |
shr.u32 %r649, %r648, 16; | |
shl.b32 %r650, %r647, 16; | |
shr.u32 %r651, %r647, 16; | |
shl.b32 %r652, %r648, 16; | |
or.b32 %r653, %r649, %r650; | |
or.b32 %r654, %r651, %r652; | |
mov.b64 %rd756, {%r654, %r653}; | |
add.s64 %rd757, %rd756, %rd749; | |
xor.b64 %rd758, %rd757, %rd751; | |
mov.b64 {%r655, %r656}, %rd758; | |
shr.u32 %r657, %r655, 31; | |
shl.b32 %r658, %r656, 1; | |
shr.u32 %r659, %r656, 31; | |
shl.b32 %r660, %r655, 1; | |
or.b32 %r661, %r657, %r658; | |
or.b32 %r662, %r659, %r660; | |
mov.b64 %rd759, {%r662, %r661}; | |
ld.local.u64 %rd760, [%rd37]; | |
add.s64 %rd761, %rd706, %rd760; | |
add.s64 %rd762, %rd761, %rd695; | |
xor.b64 %rd763, %rd762, %rd724; | |
mov.b64 {%r663, %r664}, %rd763; | |
mov.b64 %rd764, {%r664, %r663}; | |
add.s64 %rd765, %rd764, %rd741; | |
xor.b64 %rd766, %rd765, %rd695; | |
mov.b64 {%r665, %r666}, %rd766; | |
shr.u32 %r667, %r666, 24; | |
shl.b32 %r668, %r665, 8; | |
shr.u32 %r669, %r665, 24; | |
shl.b32 %r670, %r666, 8; | |
or.b32 %r671, %r667, %r668; | |
or.b32 %r672, %r669, %r670; | |
mov.b64 %rd767, {%r672, %r671}; | |
ld.local.u64 %rd768, [%rd38]; | |
add.s64 %rd769, %rd762, %rd768; | |
add.s64 %rd770, %rd769, %rd767; | |
xor.b64 %rd771, %rd770, %rd764; | |
mov.b64 {%r673, %r674}, %rd771; | |
shr.u32 %r675, %r674, 16; | |
shl.b32 %r676, %r673, 16; | |
shr.u32 %r677, %r673, 16; | |
shl.b32 %r678, %r674, 16; | |
or.b32 %r679, %r675, %r676; | |
or.b32 %r680, %r677, %r678; | |
mov.b64 %rd772, {%r680, %r679}; | |
add.s64 %rd773, %rd772, %rd765; | |
xor.b64 %rd774, %rd773, %rd767; | |
mov.b64 {%r681, %r682}, %rd774; | |
shr.u32 %r683, %r681, 31; | |
shl.b32 %r684, %r682, 1; | |
shr.u32 %r685, %r682, 31; | |
shl.b32 %r686, %r681, 1; | |
or.b32 %r687, %r683, %r684; | |
or.b32 %r688, %r685, %r686; | |
mov.b64 %rd775, {%r688, %r687}; | |
ld.local.u64 %rd776, [%rd39]; | |
add.s64 %rd777, %rd722, %rd776; | |
add.s64 %rd778, %rd777, %rd711; | |
xor.b64 %rd779, %rd778, %rd740; | |
mov.b64 {%r689, %r690}, %rd779; | |
mov.b64 %rd780, {%r690, %r689}; | |
add.s64 %rd781, %rd780, %rd693; | |
xor.b64 %rd782, %rd781, %rd711; | |
mov.b64 {%r691, %r692}, %rd782; | |
shr.u32 %r693, %r692, 24; | |
shl.b32 %r694, %r691, 8; | |
shr.u32 %r695, %r691, 24; | |
shl.b32 %r696, %r692, 8; | |
or.b32 %r697, %r693, %r694; | |
or.b32 %r698, %r695, %r696; | |
mov.b64 %rd783, {%r698, %r697}; | |
ld.local.u64 %rd784, [%rd40]; | |
add.s64 %rd785, %rd778, %rd784; | |
add.s64 %rd786, %rd785, %rd783; | |
xor.b64 %rd787, %rd786, %rd780; | |
mov.b64 {%r699, %r700}, %rd787; | |
shr.u32 %r701, %r700, 16; | |
shl.b32 %r702, %r699, 16; | |
shr.u32 %r703, %r699, 16; | |
shl.b32 %r704, %r700, 16; | |
or.b32 %r705, %r701, %r702; | |
or.b32 %r706, %r703, %r704; | |
mov.b64 %rd788, {%r706, %r705}; | |
add.s64 %rd789, %rd788, %rd781; | |
xor.b64 %rd790, %rd789, %rd783; | |
mov.b64 {%r707, %r708}, %rd790; | |
shr.u32 %r709, %r707, 31; | |
shl.b32 %r710, %r708, 1; | |
shr.u32 %r711, %r708, 31; | |
shl.b32 %r712, %r707, 1; | |
or.b32 %r713, %r709, %r710; | |
or.b32 %r714, %r711, %r712; | |
mov.b64 %rd791, {%r714, %r713}; | |
ld.local.u64 %rd792, [%rd41]; | |
add.s64 %rd793, %rd738, %rd792; | |
add.s64 %rd794, %rd793, %rd727; | |
xor.b64 %rd795, %rd794, %rd692; | |
mov.b64 {%r715, %r716}, %rd795; | |
mov.b64 %rd796, {%r716, %r715}; | |
add.s64 %rd797, %rd796, %rd709; | |
xor.b64 %rd798, %rd797, %rd727; | |
mov.b64 {%r717, %r718}, %rd798; | |
shr.u32 %r719, %r718, 24; | |
shl.b32 %r720, %r717, 8; | |
shr.u32 %r721, %r717, 24; | |
shl.b32 %r722, %r718, 8; | |
or.b32 %r723, %r719, %r720; | |
or.b32 %r724, %r721, %r722; | |
mov.b64 %rd799, {%r724, %r723}; | |
ld.local.u64 %rd800, [%rd42]; | |
add.s64 %rd801, %rd794, %rd800; | |
add.s64 %rd802, %rd801, %rd799; | |
xor.b64 %rd803, %rd802, %rd796; | |
mov.b64 {%r725, %r726}, %rd803; | |
shr.u32 %r727, %r726, 16; | |
shl.b32 %r728, %r725, 16; | |
shr.u32 %r729, %r725, 16; | |
shl.b32 %r730, %r726, 16; | |
or.b32 %r731, %r727, %r728; | |
or.b32 %r732, %r729, %r730; | |
mov.b64 %rd804, {%r732, %r731}; | |
add.s64 %rd805, %rd804, %rd797; | |
xor.b64 %rd806, %rd805, %rd799; | |
mov.b64 {%r733, %r734}, %rd806; | |
shr.u32 %r735, %r733, 31; | |
shl.b32 %r736, %r734, 1; | |
shr.u32 %r737, %r734, 31; | |
shl.b32 %r738, %r733, 1; | |
or.b32 %r739, %r735, %r736; | |
or.b32 %r740, %r737, %r738; | |
mov.b64 %rd807, {%r740, %r739}; | |
ld.local.u64 %rd808, [%rd43]; | |
add.s64 %rd809, %rd754, %rd808; | |
add.s64 %rd810, %rd809, %rd775; | |
xor.b64 %rd811, %rd810, %rd804; | |
mov.b64 {%r741, %r742}, %rd811; | |
mov.b64 %rd812, {%r742, %r741}; | |
add.s64 %rd813, %rd812, %rd789; | |
xor.b64 %rd814, %rd813, %rd775; | |
mov.b64 {%r743, %r744}, %rd814; | |
shr.u32 %r745, %r744, 24; | |
shl.b32 %r746, %r743, 8; | |
shr.u32 %r747, %r743, 24; | |
shl.b32 %r748, %r744, 8; | |
or.b32 %r749, %r745, %r746; | |
or.b32 %r750, %r747, %r748; | |
mov.b64 %rd815, {%r750, %r749}; | |
ld.local.u64 %rd816, [%rd44]; | |
add.s64 %rd817, %rd810, %rd816; | |
add.s64 %rd818, %rd817, %rd815; | |
xor.b64 %rd819, %rd818, %rd812; | |
mov.b64 {%r751, %r752}, %rd819; | |
shr.u32 %r753, %r752, 16; | |
shl.b32 %r754, %r751, 16; | |
shr.u32 %r755, %r751, 16; | |
shl.b32 %r756, %r752, 16; | |
or.b32 %r757, %r753, %r754; | |
or.b32 %r758, %r755, %r756; | |
mov.b64 %rd820, {%r758, %r757}; | |
add.s64 %rd821, %rd820, %rd813; | |
xor.b64 %rd822, %rd821, %rd815; | |
mov.b64 {%r759, %r760}, %rd822; | |
shr.u32 %r761, %r759, 31; | |
shl.b32 %r762, %r760, 1; | |
shr.u32 %r763, %r760, 31; | |
shl.b32 %r764, %r759, 1; | |
or.b32 %r765, %r761, %r762; | |
or.b32 %r766, %r763, %r764; | |
mov.b64 %rd823, {%r766, %r765}; | |
ld.local.u64 %rd824, [%rd45]; | |
add.s64 %rd825, %rd770, %rd824; | |
add.s64 %rd826, %rd825, %rd791; | |
xor.b64 %rd827, %rd826, %rd756; | |
mov.b64 {%r767, %r768}, %rd827; | |
mov.b64 %rd828, {%r768, %r767}; | |
add.s64 %rd829, %rd828, %rd805; | |
xor.b64 %rd830, %rd829, %rd791; | |
mov.b64 {%r769, %r770}, %rd830; | |
shr.u32 %r771, %r770, 24; | |
shl.b32 %r772, %r769, 8; | |
shr.u32 %r773, %r769, 24; | |
shl.b32 %r774, %r770, 8; | |
or.b32 %r775, %r771, %r772; | |
or.b32 %r776, %r773, %r774; | |
mov.b64 %rd831, {%r776, %r775}; | |
ld.local.u64 %rd832, [%rd46]; | |
add.s64 %rd833, %rd826, %rd832; | |
add.s64 %rd834, %rd833, %rd831; | |
xor.b64 %rd835, %rd834, %rd828; | |
mov.b64 {%r777, %r778}, %rd835; | |
shr.u32 %r779, %r778, 16; | |
shl.b32 %r780, %r777, 16; | |
shr.u32 %r781, %r777, 16; | |
shl.b32 %r782, %r778, 16; | |
or.b32 %r783, %r779, %r780; | |
or.b32 %r784, %r781, %r782; | |
mov.b64 %rd836, {%r784, %r783}; | |
add.s64 %rd837, %rd836, %rd829; | |
xor.b64 %rd838, %rd837, %rd831; | |
mov.b64 {%r785, %r786}, %rd838; | |
shr.u32 %r787, %r785, 31; | |
shl.b32 %r788, %r786, 1; | |
shr.u32 %r789, %r786, 31; | |
shl.b32 %r790, %r785, 1; | |
or.b32 %r791, %r787, %r788; | |
or.b32 %r792, %r789, %r790; | |
mov.b64 %rd839, {%r792, %r791}; | |
ld.local.u64 %rd840, [%rd47]; | |
add.s64 %rd841, %rd786, %rd840; | |
add.s64 %rd842, %rd841, %rd807; | |
xor.b64 %rd843, %rd842, %rd772; | |
mov.b64 {%r793, %r794}, %rd843; | |
mov.b64 %rd844, {%r794, %r793}; | |
add.s64 %rd845, %rd844, %rd757; | |
xor.b64 %rd846, %rd845, %rd807; | |
mov.b64 {%r795, %r796}, %rd846; | |
shr.u32 %r797, %r796, 24; | |
shl.b32 %r798, %r795, 8; | |
shr.u32 %r799, %r795, 24; | |
shl.b32 %r800, %r796, 8; | |
or.b32 %r801, %r797, %r798; | |
or.b32 %r802, %r799, %r800; | |
mov.b64 %rd847, {%r802, %r801}; | |
ld.local.u64 %rd848, [%rd48]; | |
add.s64 %rd849, %rd842, %rd848; | |
add.s64 %rd850, %rd849, %rd847; | |
xor.b64 %rd851, %rd850, %rd844; | |
mov.b64 {%r803, %r804}, %rd851; | |
shr.u32 %r805, %r804, 16; | |
shl.b32 %r806, %r803, 16; | |
shr.u32 %r807, %r803, 16; | |
shl.b32 %r808, %r804, 16; | |
or.b32 %r809, %r805, %r806; | |
or.b32 %r810, %r807, %r808; | |
mov.b64 %rd852, {%r810, %r809}; | |
add.s64 %rd853, %rd852, %rd845; | |
xor.b64 %rd854, %rd853, %rd847; | |
mov.b64 {%r811, %r812}, %rd854; | |
shr.u32 %r813, %r811, 31; | |
shl.b32 %r814, %r812, 1; | |
shr.u32 %r815, %r812, 31; | |
shl.b32 %r816, %r811, 1; | |
or.b32 %r817, %r813, %r814; | |
or.b32 %r818, %r815, %r816; | |
mov.b64 %rd855, {%r818, %r817}; | |
ld.local.u64 %rd856, [%rd49]; | |
add.s64 %rd857, %rd802, %rd856; | |
add.s64 %rd858, %rd857, %rd759; | |
xor.b64 %rd859, %rd858, %rd788; | |
mov.b64 {%r819, %r820}, %rd859; | |
mov.b64 %rd860, {%r820, %r819}; | |
add.s64 %rd861, %rd860, %rd773; | |
xor.b64 %rd862, %rd861, %rd759; | |
mov.b64 {%r821, %r822}, %rd862; | |
shr.u32 %r823, %r822, 24; | |
shl.b32 %r824, %r821, 8; | |
shr.u32 %r825, %r821, 24; | |
shl.b32 %r826, %r822, 8; | |
or.b32 %r827, %r823, %r824; | |
or.b32 %r828, %r825, %r826; | |
mov.b64 %rd863, {%r828, %r827}; | |
ld.local.u64 %rd864, [%rd50]; | |
add.s64 %rd865, %rd858, %rd864; | |
add.s64 %rd866, %rd865, %rd863; | |
xor.b64 %rd867, %rd866, %rd860; | |
mov.b64 {%r829, %r830}, %rd867; | |
shr.u32 %r831, %r830, 16; | |
shl.b32 %r832, %r829, 16; | |
shr.u32 %r833, %r829, 16; | |
shl.b32 %r834, %r830, 16; | |
or.b32 %r835, %r831, %r832; | |
or.b32 %r836, %r833, %r834; | |
mov.b64 %rd868, {%r836, %r835}; | |
add.s64 %rd869, %rd868, %rd861; | |
xor.b64 %rd870, %rd869, %rd863; | |
mov.b64 {%r837, %r838}, %rd870; | |
shr.u32 %r839, %r837, 31; | |
shl.b32 %r840, %r838, 1; | |
shr.u32 %r841, %r838, 31; | |
shl.b32 %r842, %r837, 1; | |
or.b32 %r843, %r839, %r840; | |
or.b32 %r844, %r841, %r842; | |
mov.b64 %rd871, {%r844, %r843}; | |
ld.local.u64 %rd872, [%rd51]; | |
add.s64 %rd873, %rd818, %rd872; | |
add.s64 %rd874, %rd873, %rd871; | |
xor.b64 %rd875, %rd874, %rd836; | |
mov.b64 {%r845, %r846}, %rd875; | |
mov.b64 %rd876, {%r846, %r845}; | |
add.s64 %rd877, %rd876, %rd853; | |
xor.b64 %rd878, %rd877, %rd871; | |
mov.b64 {%r847, %r848}, %rd878; | |
shr.u32 %r849, %r848, 24; | |
shl.b32 %r850, %r847, 8; | |
shr.u32 %r851, %r847, 24; | |
shl.b32 %r852, %r848, 8; | |
or.b32 %r853, %r849, %r850; | |
or.b32 %r854, %r851, %r852; | |
mov.b64 %rd879, {%r854, %r853}; | |
ld.local.u64 %rd880, [%rd52]; | |
add.s64 %rd881, %rd874, %rd880; | |
add.s64 %rd882, %rd881, %rd879; | |
xor.b64 %rd883, %rd882, %rd876; | |
mov.b64 {%r855, %r856}, %rd883; | |
shr.u32 %r857, %r856, 16; | |
shl.b32 %r858, %r855, 16; | |
shr.u32 %r859, %r855, 16; | |
shl.b32 %r860, %r856, 16; | |
or.b32 %r861, %r857, %r858; | |
or.b32 %r862, %r859, %r860; | |
mov.b64 %rd884, {%r862, %r861}; | |
add.s64 %rd885, %rd884, %rd877; | |
xor.b64 %rd886, %rd885, %rd879; | |
mov.b64 {%r863, %r864}, %rd886; | |
shr.u32 %r865, %r863, 31; | |
shl.b32 %r866, %r864, 1; | |
shr.u32 %r867, %r864, 31; | |
shl.b32 %r868, %r863, 1; | |
or.b32 %r869, %r865, %r866; | |
or.b32 %r870, %r867, %r868; | |
mov.b64 %rd887, {%r870, %r869}; | |
ld.local.u64 %rd888, [%rd53]; | |
add.s64 %rd889, %rd834, %rd888; | |
add.s64 %rd890, %rd889, %rd823; | |
xor.b64 %rd891, %rd890, %rd852; | |
mov.b64 {%r871, %r872}, %rd891; | |
mov.b64 %rd892, {%r872, %r871}; | |
add.s64 %rd893, %rd892, %rd869; | |
xor.b64 %rd894, %rd893, %rd823; | |
mov.b64 {%r873, %r874}, %rd894; | |
shr.u32 %r875, %r874, 24; | |
shl.b32 %r876, %r873, 8; | |
shr.u32 %r877, %r873, 24; | |
shl.b32 %r878, %r874, 8; | |
or.b32 %r879, %r875, %r876; | |
or.b32 %r880, %r877, %r878; | |
mov.b64 %rd895, {%r880, %r879}; | |
ld.local.u64 %rd896, [%rd54]; | |
add.s64 %rd897, %rd890, %rd896; | |
add.s64 %rd898, %rd897, %rd895; | |
xor.b64 %rd899, %rd898, %rd892; | |
mov.b64 {%r881, %r882}, %rd899; | |
shr.u32 %r883, %r882, 16; | |
shl.b32 %r884, %r881, 16; | |
shr.u32 %r885, %r881, 16; | |
shl.b32 %r886, %r882, 16; | |
or.b32 %r887, %r883, %r884; | |
or.b32 %r888, %r885, %r886; | |
mov.b64 %rd900, {%r888, %r887}; | |
add.s64 %rd901, %rd900, %rd893; | |
xor.b64 %rd902, %rd901, %rd895; | |
mov.b64 {%r889, %r890}, %rd902; | |
shr.u32 %r891, %r889, 31; | |
shl.b32 %r892, %r890, 1; | |
shr.u32 %r893, %r890, 31; | |
shl.b32 %r894, %r889, 1; | |
or.b32 %r895, %r891, %r892; | |
or.b32 %r896, %r893, %r894; | |
mov.b64 %rd903, {%r896, %r895}; | |
ld.local.u64 %rd904, [%rd55]; | |
add.s64 %rd905, %rd850, %rd904; | |
add.s64 %rd906, %rd905, %rd839; | |
xor.b64 %rd907, %rd906, %rd868; | |
mov.b64 {%r897, %r898}, %rd907; | |
mov.b64 %rd908, {%r898, %r897}; | |
add.s64 %rd909, %rd908, %rd821; | |
xor.b64 %rd910, %rd909, %rd839; | |
mov.b64 {%r899, %r900}, %rd910; | |
shr.u32 %r901, %r900, 24; | |
shl.b32 %r902, %r899, 8; | |
shr.u32 %r903, %r899, 24; | |
shl.b32 %r904, %r900, 8; | |
or.b32 %r905, %r901, %r902; | |
or.b32 %r906, %r903, %r904; | |
mov.b64 %rd911, {%r906, %r905}; | |
ld.local.u64 %rd912, [%rd56]; | |
add.s64 %rd913, %rd906, %rd912; | |
add.s64 %rd914, %rd913, %rd911; | |
xor.b64 %rd915, %rd914, %rd908; | |
mov.b64 {%r907, %r908}, %rd915; | |
shr.u32 %r909, %r908, 16; | |
shl.b32 %r910, %r907, 16; | |
shr.u32 %r911, %r907, 16; | |
shl.b32 %r912, %r908, 16; | |
or.b32 %r913, %r909, %r910; | |
or.b32 %r914, %r911, %r912; | |
mov.b64 %rd916, {%r914, %r913}; | |
add.s64 %rd917, %rd916, %rd909; | |
xor.b64 %rd918, %rd917, %rd911; | |
mov.b64 {%r915, %r916}, %rd918; | |
shr.u32 %r917, %r915, 31; | |
shl.b32 %r918, %r916, 1; | |
shr.u32 %r919, %r916, 31; | |
shl.b32 %r920, %r915, 1; | |
or.b32 %r921, %r917, %r918; | |
or.b32 %r922, %r919, %r920; | |
mov.b64 %rd919, {%r922, %r921}; | |
ld.local.u64 %rd920, [%rd57]; | |
add.s64 %rd921, %rd866, %rd920; | |
add.s64 %rd922, %rd921, %rd855; | |
xor.b64 %rd923, %rd922, %rd820; | |
mov.b64 {%r923, %r924}, %rd923; | |
mov.b64 %rd924, {%r924, %r923}; | |
add.s64 %rd925, %rd924, %rd837; | |
xor.b64 %rd926, %rd925, %rd855; | |
mov.b64 {%r925, %r926}, %rd926; | |
shr.u32 %r927, %r926, 24; | |
shl.b32 %r928, %r925, 8; | |
shr.u32 %r929, %r925, 24; | |
shl.b32 %r930, %r926, 8; | |
or.b32 %r931, %r927, %r928; | |
or.b32 %r932, %r929, %r930; | |
mov.b64 %rd927, {%r932, %r931}; | |
ld.local.u64 %rd928, [%rd58]; | |
add.s64 %rd929, %rd922, %rd928; | |
add.s64 %rd930, %rd929, %rd927; | |
xor.b64 %rd931, %rd930, %rd924; | |
mov.b64 {%r933, %r934}, %rd931; | |
shr.u32 %r935, %r934, 16; | |
shl.b32 %r936, %r933, 16; | |
shr.u32 %r937, %r933, 16; | |
shl.b32 %r938, %r934, 16; | |
or.b32 %r939, %r935, %r936; | |
or.b32 %r940, %r937, %r938; | |
mov.b64 %rd932, {%r940, %r939}; | |
add.s64 %rd933, %rd932, %rd925; | |
xor.b64 %rd934, %rd933, %rd927; | |
mov.b64 {%r941, %r942}, %rd934; | |
shr.u32 %r943, %r941, 31; | |
shl.b32 %r944, %r942, 1; | |
shr.u32 %r945, %r942, 31; | |
shl.b32 %r946, %r941, 1; | |
or.b32 %r947, %r943, %r944; | |
or.b32 %r948, %r945, %r946; | |
mov.b64 %rd935, {%r948, %r947}; | |
ld.local.u64 %rd936, [%rd59]; | |
add.s64 %rd937, %rd882, %rd936; | |
add.s64 %rd938, %rd937, %rd903; | |
xor.b64 %rd939, %rd938, %rd932; | |
mov.b64 {%r949, %r950}, %rd939; | |
mov.b64 %rd940, {%r950, %r949}; | |
add.s64 %rd941, %rd940, %rd917; | |
xor.b64 %rd942, %rd941, %rd903; | |
mov.b64 {%r951, %r952}, %rd942; | |
shr.u32 %r953, %r952, 24; | |
shl.b32 %r954, %r951, 8; | |
shr.u32 %r955, %r951, 24; | |
shl.b32 %r956, %r952, 8; | |
or.b32 %r957, %r953, %r954; | |
or.b32 %r958, %r955, %r956; | |
mov.b64 %rd943, {%r958, %r957}; | |
ld.local.u64 %rd944, [%rd60]; | |
add.s64 %rd945, %rd938, %rd944; | |
add.s64 %rd946, %rd945, %rd943; | |
xor.b64 %rd947, %rd946, %rd940; | |
mov.b64 {%r959, %r960}, %rd947; | |
shr.u32 %r961, %r960, 16; | |
shl.b32 %r962, %r959, 16; | |
shr.u32 %r963, %r959, 16; | |
shl.b32 %r964, %r960, 16; | |
or.b32 %r965, %r961, %r962; | |
or.b32 %r966, %r963, %r964; | |
mov.b64 %rd948, {%r966, %r965}; | |
add.s64 %rd949, %rd948, %rd941; | |
xor.b64 %rd950, %rd949, %rd943; | |
mov.b64 {%r967, %r968}, %rd950; | |
shr.u32 %r969, %r967, 31; | |
shl.b32 %r970, %r968, 1; | |
shr.u32 %r971, %r968, 31; | |
shl.b32 %r972, %r967, 1; | |
or.b32 %r973, %r969, %r970; | |
or.b32 %r974, %r971, %r972; | |
mov.b64 %rd951, {%r974, %r973}; | |
ld.local.u64 %rd952, [%rd61]; | |
add.s64 %rd953, %rd898, %rd952; | |
add.s64 %rd954, %rd953, %rd919; | |
xor.b64 %rd955, %rd954, %rd884; | |
mov.b64 {%r975, %r976}, %rd955; | |
mov.b64 %rd956, {%r976, %r975}; | |
add.s64 %rd957, %rd956, %rd933; | |
xor.b64 %rd958, %rd957, %rd919; | |
mov.b64 {%r977, %r978}, %rd958; | |
shr.u32 %r979, %r978, 24; | |
shl.b32 %r980, %r977, 8; | |
shr.u32 %r981, %r977, 24; | |
shl.b32 %r982, %r978, 8; | |
or.b32 %r983, %r979, %r980; | |
or.b32 %r984, %r981, %r982; | |
mov.b64 %rd959, {%r984, %r983}; | |
ld.local.u64 %rd960, [%rd62]; | |
add.s64 %rd961, %rd954, %rd960; | |
add.s64 %rd962, %rd961, %rd959; | |
xor.b64 %rd963, %rd962, %rd956; | |
mov.b64 {%r985, %r986}, %rd963; | |
shr.u32 %r987, %r986, 16; | |
shl.b32 %r988, %r985, 16; | |
shr.u32 %r989, %r985, 16; | |
shl.b32 %r990, %r986, 16; | |
or.b32 %r991, %r987, %r988; | |
or.b32 %r992, %r989, %r990; | |
mov.b64 %rd964, {%r992, %r991}; | |
add.s64 %rd965, %rd964, %rd957; | |
xor.b64 %rd966, %rd965, %rd959; | |
mov.b64 {%r993, %r994}, %rd966; | |
shr.u32 %r995, %r993, 31; | |
shl.b32 %r996, %r994, 1; | |
shr.u32 %r997, %r994, 31; | |
shl.b32 %r998, %r993, 1; | |
or.b32 %r999, %r995, %r996; | |
or.b32 %r1000, %r997, %r998; | |
mov.b64 %rd967, {%r1000, %r999}; | |
ld.local.u64 %rd968, [%rd63]; | |
add.s64 %rd969, %rd914, %rd968; | |
add.s64 %rd970, %rd969, %rd935; | |
xor.b64 %rd971, %rd970, %rd900; | |
mov.b64 {%r1001, %r1002}, %rd971; | |
mov.b64 %rd972, {%r1002, %r1001}; | |
add.s64 %rd973, %rd972, %rd885; | |
xor.b64 %rd974, %rd973, %rd935; | |
mov.b64 {%r1003, %r1004}, %rd974; | |
shr.u32 %r1005, %r1004, 24; | |
shl.b32 %r1006, %r1003, 8; | |
shr.u32 %r1007, %r1003, 24; | |
shl.b32 %r1008, %r1004, 8; | |
or.b32 %r1009, %r1005, %r1006; | |
or.b32 %r1010, %r1007, %r1008; | |
mov.b64 %rd975, {%r1010, %r1009}; | |
ld.local.u64 %rd976, [%rd64]; | |
add.s64 %rd977, %rd970, %rd976; | |
add.s64 %rd978, %rd977, %rd975; | |
xor.b64 %rd979, %rd978, %rd972; | |
mov.b64 {%r1011, %r1012}, %rd979; | |
shr.u32 %r1013, %r1012, 16; | |
shl.b32 %r1014, %r1011, 16; | |
shr.u32 %r1015, %r1011, 16; | |
shl.b32 %r1016, %r1012, 16; | |
or.b32 %r1017, %r1013, %r1014; | |
or.b32 %r1018, %r1015, %r1016; | |
mov.b64 %rd980, {%r1018, %r1017}; | |
add.s64 %rd981, %rd980, %rd973; | |
xor.b64 %rd982, %rd981, %rd975; | |
mov.b64 {%r1019, %r1020}, %rd982; | |
shr.u32 %r1021, %r1019, 31; | |
shl.b32 %r1022, %r1020, 1; | |
shr.u32 %r1023, %r1020, 31; | |
shl.b32 %r1024, %r1019, 1; | |
or.b32 %r1025, %r1021, %r1022; | |
or.b32 %r1026, %r1023, %r1024; | |
mov.b64 %rd983, {%r1026, %r1025}; | |
ld.local.u64 %rd984, [%rd65]; | |
add.s64 %rd985, %rd930, %rd984; | |
add.s64 %rd986, %rd985, %rd887; | |
xor.b64 %rd987, %rd986, %rd916; | |
mov.b64 {%r1027, %r1028}, %rd987; | |
mov.b64 %rd988, {%r1028, %r1027}; | |
add.s64 %rd989, %rd988, %rd901; | |
xor.b64 %rd990, %rd989, %rd887; | |
mov.b64 {%r1029, %r1030}, %rd990; | |
shr.u32 %r1031, %r1030, 24; | |
shl.b32 %r1032, %r1029, 8; | |
shr.u32 %r1033, %r1029, 24; | |
shl.b32 %r1034, %r1030, 8; | |
or.b32 %r1035, %r1031, %r1032; | |
or.b32 %r1036, %r1033, %r1034; | |
mov.b64 %rd991, {%r1036, %r1035}; | |
ld.local.u64 %rd992, [%rd66]; | |
add.s64 %rd993, %rd986, %rd992; | |
add.s64 %rd994, %rd993, %rd991; | |
xor.b64 %rd995, %rd994, %rd988; | |
mov.b64 {%r1037, %r1038}, %rd995; | |
shr.u32 %r1039, %r1038, 16; | |
shl.b32 %r1040, %r1037, 16; | |
shr.u32 %r1041, %r1037, 16; | |
shl.b32 %r1042, %r1038, 16; | |
or.b32 %r1043, %r1039, %r1040; | |
or.b32 %r1044, %r1041, %r1042; | |
mov.b64 %rd996, {%r1044, %r1043}; | |
add.s64 %rd997, %rd996, %rd989; | |
xor.b64 %rd998, %rd997, %rd991; | |
mov.b64 {%r1045, %r1046}, %rd998; | |
shr.u32 %r1047, %r1045, 31; | |
shl.b32 %r1048, %r1046, 1; | |
shr.u32 %r1049, %r1046, 31; | |
shl.b32 %r1050, %r1045, 1; | |
or.b32 %r1051, %r1047, %r1048; | |
or.b32 %r1052, %r1049, %r1050; | |
mov.b64 %rd999, {%r1052, %r1051}; | |
ld.local.u64 %rd1000, [%rd67]; | |
add.s64 %rd1001, %rd946, %rd1000; | |
add.s64 %rd1002, %rd1001, %rd999; | |
xor.b64 %rd1003, %rd1002, %rd964; | |
mov.b64 {%r1053, %r1054}, %rd1003; | |
mov.b64 %rd1004, {%r1054, %r1053}; | |
add.s64 %rd1005, %rd1004, %rd981; | |
xor.b64 %rd1006, %rd1005, %rd999; | |
mov.b64 {%r1055, %r1056}, %rd1006; | |
shr.u32 %r1057, %r1056, 24; | |
shl.b32 %r1058, %r1055, 8; | |
shr.u32 %r1059, %r1055, 24; | |
shl.b32 %r1060, %r1056, 8; | |
or.b32 %r1061, %r1057, %r1058; | |
or.b32 %r1062, %r1059, %r1060; | |
mov.b64 %rd1007, {%r1062, %r1061}; | |
ld.local.u64 %rd1008, [%rd68]; | |
add.s64 %rd1009, %rd1002, %rd1008; | |
add.s64 %rd1010, %rd1009, %rd1007; | |
xor.b64 %rd1011, %rd1010, %rd1004; | |
mov.b64 {%r1063, %r1064}, %rd1011; | |
shr.u32 %r1065, %r1064, 16; | |
shl.b32 %r1066, %r1063, 16; | |
shr.u32 %r1067, %r1063, 16; | |
shl.b32 %r1068, %r1064, 16; | |
or.b32 %r1069, %r1065, %r1066; | |
or.b32 %r1070, %r1067, %r1068; | |
mov.b64 %rd1012, {%r1070, %r1069}; | |
add.s64 %rd1013, %rd1012, %rd1005; | |
xor.b64 %rd1014, %rd1013, %rd1007; | |
mov.b64 {%r1071, %r1072}, %rd1014; | |
shr.u32 %r1073, %r1071, 31; | |
shl.b32 %r1074, %r1072, 1; | |
shr.u32 %r1075, %r1072, 31; | |
shl.b32 %r1076, %r1071, 1; | |
or.b32 %r1077, %r1073, %r1074; | |
or.b32 %r1078, %r1075, %r1076; | |
mov.b64 %rd1015, {%r1078, %r1077}; | |
ld.local.u64 %rd1016, [%rd69]; | |
add.s64 %rd1017, %rd962, %rd1016; | |
add.s64 %rd1018, %rd1017, %rd951; | |
xor.b64 %rd1019, %rd1018, %rd980; | |
mov.b64 {%r1079, %r1080}, %rd1019; | |
mov.b64 %rd1020, {%r1080, %r1079}; | |
add.s64 %rd1021, %rd1020, %rd997; | |
xor.b64 %rd1022, %rd1021, %rd951; | |
mov.b64 {%r1081, %r1082}, %rd1022; | |
shr.u32 %r1083, %r1082, 24; | |
shl.b32 %r1084, %r1081, 8; | |
shr.u32 %r1085, %r1081, 24; | |
shl.b32 %r1086, %r1082, 8; | |
or.b32 %r1087, %r1083, %r1084; | |
or.b32 %r1088, %r1085, %r1086; | |
mov.b64 %rd1023, {%r1088, %r1087}; | |
ld.local.u64 %rd1024, [%rd70]; | |
add.s64 %rd1025, %rd1018, %rd1024; | |
add.s64 %rd1026, %rd1025, %rd1023; | |
xor.b64 %rd1027, %rd1026, %rd1020; | |
mov.b64 {%r1089, %r1090}, %rd1027; | |
shr.u32 %r1091, %r1090, 16; | |
shl.b32 %r1092, %r1089, 16; | |
shr.u32 %r1093, %r1089, 16; | |
shl.b32 %r1094, %r1090, 16; | |
or.b32 %r1095, %r1091, %r1092; | |
or.b32 %r1096, %r1093, %r1094; | |
mov.b64 %rd1028, {%r1096, %r1095}; | |
add.s64 %rd1029, %rd1028, %rd1021; | |
xor.b64 %rd1030, %rd1029, %rd1023; | |
mov.b64 {%r1097, %r1098}, %rd1030; | |
shr.u32 %r1099, %r1097, 31; | |
shl.b32 %r1100, %r1098, 1; | |
shr.u32 %r1101, %r1098, 31; | |
shl.b32 %r1102, %r1097, 1; | |
or.b32 %r1103, %r1099, %r1100; | |
or.b32 %r1104, %r1101, %r1102; | |
mov.b64 %rd1031, {%r1104, %r1103}; | |
ld.local.u64 %rd1032, [%rd71]; | |
add.s64 %rd1033, %rd978, %rd1032; | |
add.s64 %rd1034, %rd1033, %rd967; | |
xor.b64 %rd1035, %rd1034, %rd996; | |
mov.b64 {%r1105, %r1106}, %rd1035; | |
mov.b64 %rd1036, {%r1106, %r1105}; | |
add.s64 %rd1037, %rd1036, %rd949; | |
xor.b64 %rd1038, %rd1037, %rd967; | |
mov.b64 {%r1107, %r1108}, %rd1038; | |
shr.u32 %r1109, %r1108, 24; | |
shl.b32 %r1110, %r1107, 8; | |
shr.u32 %r1111, %r1107, 24; | |
shl.b32 %r1112, %r1108, 8; | |
or.b32 %r1113, %r1109, %r1110; | |
or.b32 %r1114, %r1111, %r1112; | |
mov.b64 %rd1039, {%r1114, %r1113}; | |
ld.local.u64 %rd1040, [%rd72]; | |
add.s64 %rd1041, %rd1034, %rd1040; | |
add.s64 %rd1042, %rd1041, %rd1039; | |
xor.b64 %rd1043, %rd1042, %rd1036; | |
mov.b64 {%r1115, %r1116}, %rd1043; | |
shr.u32 %r1117, %r1116, 16; | |
shl.b32 %r1118, %r1115, 16; | |
shr.u32 %r1119, %r1115, 16; | |
shl.b32 %r1120, %r1116, 16; | |
or.b32 %r1121, %r1117, %r1118; | |
or.b32 %r1122, %r1119, %r1120; | |
mov.b64 %rd1044, {%r1122, %r1121}; | |
add.s64 %rd1045, %rd1044, %rd1037; | |
xor.b64 %rd1046, %rd1045, %rd1039; | |
mov.b64 {%r1123, %r1124}, %rd1046; | |
shr.u32 %r1125, %r1123, 31; | |
shl.b32 %r1126, %r1124, 1; | |
shr.u32 %r1127, %r1124, 31; | |
shl.b32 %r1128, %r1123, 1; | |
or.b32 %r1129, %r1125, %r1126; | |
or.b32 %r1130, %r1127, %r1128; | |
mov.b64 %rd1047, {%r1130, %r1129}; | |
ld.local.u64 %rd1048, [%rd73]; | |
add.s64 %rd1049, %rd994, %rd1048; | |
add.s64 %rd1050, %rd1049, %rd983; | |
xor.b64 %rd1051, %rd1050, %rd948; | |
mov.b64 {%r1131, %r1132}, %rd1051; | |
mov.b64 %rd1052, {%r1132, %r1131}; | |
add.s64 %rd1053, %rd1052, %rd965; | |
xor.b64 %rd1054, %rd1053, %rd983; | |
mov.b64 {%r1133, %r1134}, %rd1054; | |
shr.u32 %r1135, %r1134, 24; | |
shl.b32 %r1136, %r1133, 8; | |
shr.u32 %r1137, %r1133, 24; | |
shl.b32 %r1138, %r1134, 8; | |
or.b32 %r1139, %r1135, %r1136; | |
or.b32 %r1140, %r1137, %r1138; | |
mov.b64 %rd1055, {%r1140, %r1139}; | |
ld.local.u64 %rd1056, [%rd74]; | |
add.s64 %rd1057, %rd1050, %rd1056; | |
add.s64 %rd1058, %rd1057, %rd1055; | |
xor.b64 %rd1059, %rd1058, %rd1052; | |
mov.b64 {%r1141, %r1142}, %rd1059; | |
shr.u32 %r1143, %r1142, 16; | |
shl.b32 %r1144, %r1141, 16; | |
shr.u32 %r1145, %r1141, 16; | |
shl.b32 %r1146, %r1142, 16; | |
or.b32 %r1147, %r1143, %r1144; | |
or.b32 %r1148, %r1145, %r1146; | |
mov.b64 %rd1060, {%r1148, %r1147}; | |
add.s64 %rd1061, %rd1060, %rd1053; | |
xor.b64 %rd1062, %rd1061, %rd1055; | |
mov.b64 {%r1149, %r1150}, %rd1062; | |
shr.u32 %r1151, %r1149, 31; | |
shl.b32 %r1152, %r1150, 1; | |
shr.u32 %r1153, %r1150, 31; | |
shl.b32 %r1154, %r1149, 1; | |
or.b32 %r1155, %r1151, %r1152; | |
or.b32 %r1156, %r1153, %r1154; | |
mov.b64 %rd1063, {%r1156, %r1155}; | |
ld.local.u64 %rd1064, [%rd75]; | |
add.s64 %rd1065, %rd1010, %rd1064; | |
add.s64 %rd1066, %rd1065, %rd1031; | |
xor.b64 %rd1067, %rd1066, %rd1060; | |
mov.b64 {%r1157, %r1158}, %rd1067; | |
mov.b64 %rd1068, {%r1158, %r1157}; | |
add.s64 %rd1069, %rd1068, %rd1045; | |
xor.b64 %rd1070, %rd1069, %rd1031; | |
mov.b64 {%r1159, %r1160}, %rd1070; | |
shr.u32 %r1161, %r1160, 24; | |
shl.b32 %r1162, %r1159, 8; | |
shr.u32 %r1163, %r1159, 24; | |
shl.b32 %r1164, %r1160, 8; | |
or.b32 %r1165, %r1161, %r1162; | |
or.b32 %r1166, %r1163, %r1164; | |
mov.b64 %rd1071, {%r1166, %r1165}; | |
ld.local.u64 %rd1072, [%rd76]; | |
add.s64 %rd1073, %rd1066, %rd1072; | |
add.s64 %rd1074, %rd1073, %rd1071; | |
xor.b64 %rd1075, %rd1074, %rd1068; | |
mov.b64 {%r1167, %r1168}, %rd1075; | |
shr.u32 %r1169, %r1168, 16; | |
shl.b32 %r1170, %r1167, 16; | |
shr.u32 %r1171, %r1167, 16; | |
shl.b32 %r1172, %r1168, 16; | |
or.b32 %r1173, %r1169, %r1170; | |
or.b32 %r1174, %r1171, %r1172; | |
mov.b64 %rd1076, {%r1174, %r1173}; | |
add.s64 %rd1077, %rd1076, %rd1069; | |
xor.b64 %rd1078, %rd1077, %rd1071; | |
mov.b64 {%r1175, %r1176}, %rd1078; | |
shr.u32 %r1177, %r1175, 31; | |
shl.b32 %r1178, %r1176, 1; | |
shr.u32 %r1179, %r1176, 31; | |
shl.b32 %r1180, %r1175, 1; | |
or.b32 %r1181, %r1177, %r1178; | |
or.b32 %r1182, %r1179, %r1180; | |
mov.b64 %rd1079, {%r1182, %r1181}; | |
ld.local.u64 %rd1080, [%rd77]; | |
add.s64 %rd1081, %rd1026, %rd1080; | |
add.s64 %rd1082, %rd1081, %rd1047; | |
xor.b64 %rd1083, %rd1082, %rd1012; | |
mov.b64 {%r1183, %r1184}, %rd1083; | |
mov.b64 %rd1084, {%r1184, %r1183}; | |
add.s64 %rd1085, %rd1084, %rd1061; | |
xor.b64 %rd1086, %rd1085, %rd1047; | |
mov.b64 {%r1185, %r1186}, %rd1086; | |
shr.u32 %r1187, %r1186, 24; | |
shl.b32 %r1188, %r1185, 8; | |
shr.u32 %r1189, %r1185, 24; | |
shl.b32 %r1190, %r1186, 8; | |
or.b32 %r1191, %r1187, %r1188; | |
or.b32 %r1192, %r1189, %r1190; | |
mov.b64 %rd1087, {%r1192, %r1191}; | |
ld.local.u64 %rd1088, [%rd78]; | |
add.s64 %rd1089, %rd1082, %rd1088; | |
add.s64 %rd1090, %rd1089, %rd1087; | |
xor.b64 %rd1091, %rd1090, %rd1084; | |
mov.b64 {%r1193, %r1194}, %rd1091; | |
shr.u32 %r1195, %r1194, 16; | |
shl.b32 %r1196, %r1193, 16; | |
shr.u32 %r1197, %r1193, 16; | |
shl.b32 %r1198, %r1194, 16; | |
or.b32 %r1199, %r1195, %r1196; | |
or.b32 %r1200, %r1197, %r1198; | |
mov.b64 %rd1092, {%r1200, %r1199}; | |
add.s64 %rd1093, %rd1092, %rd1085; | |
xor.b64 %rd1094, %rd1093, %rd1087; | |
mov.b64 {%r1201, %r1202}, %rd1094; | |
shr.u32 %r1203, %r1201, 31; | |
shl.b32 %r1204, %r1202, 1; | |
shr.u32 %r1205, %r1202, 31; | |
shl.b32 %r1206, %r1201, 1; | |
or.b32 %r1207, %r1203, %r1204; | |
or.b32 %r1208, %r1205, %r1206; | |
mov.b64 %rd1095, {%r1208, %r1207}; | |
ld.local.u64 %rd1096, [%rd79]; | |
add.s64 %rd1097, %rd1042, %rd1096; | |
add.s64 %rd1098, %rd1097, %rd1063; | |
xor.b64 %rd1099, %rd1098, %rd1028; | |
mov.b64 {%r1209, %r1210}, %rd1099; | |
mov.b64 %rd1100, {%r1210, %r1209}; | |
add.s64 %rd1101, %rd1100, %rd1013; | |
xor.b64 %rd1102, %rd1101, %rd1063; | |
mov.b64 {%r1211, %r1212}, %rd1102; | |
shr.u32 %r1213, %r1212, 24; | |
shl.b32 %r1214, %r1211, 8; | |
shr.u32 %r1215, %r1211, 24; | |
shl.b32 %r1216, %r1212, 8; | |
or.b32 %r1217, %r1213, %r1214; | |
or.b32 %r1218, %r1215, %r1216; | |
mov.b64 %rd1103, {%r1218, %r1217}; | |
ld.local.u64 %rd1104, [%rd80]; | |
add.s64 %rd1105, %rd1098, %rd1104; | |
add.s64 %rd1106, %rd1105, %rd1103; | |
xor.b64 %rd1107, %rd1106, %rd1100; | |
mov.b64 {%r1219, %r1220}, %rd1107; | |
shr.u32 %r1221, %r1220, 16; | |
shl.b32 %r1222, %r1219, 16; | |
shr.u32 %r1223, %r1219, 16; | |
shl.b32 %r1224, %r1220, 16; | |
or.b32 %r1225, %r1221, %r1222; | |
or.b32 %r1226, %r1223, %r1224; | |
mov.b64 %rd1108, {%r1226, %r1225}; | |
add.s64 %rd1109, %rd1108, %rd1101; | |
xor.b64 %rd1110, %rd1109, %rd1103; | |
mov.b64 {%r1227, %r1228}, %rd1110; | |
shr.u32 %r1229, %r1227, 31; | |
shl.b32 %r1230, %r1228, 1; | |
shr.u32 %r1231, %r1228, 31; | |
shl.b32 %r1232, %r1227, 1; | |
or.b32 %r1233, %r1229, %r1230; | |
or.b32 %r1234, %r1231, %r1232; | |
mov.b64 %rd1111, {%r1234, %r1233}; | |
ld.local.u64 %rd1112, [%rd81]; | |
add.s64 %rd1113, %rd1058, %rd1112; | |
add.s64 %rd1114, %rd1113, %rd1015; | |
xor.b64 %rd1115, %rd1114, %rd1044; | |
mov.b64 {%r1235, %r1236}, %rd1115; | |
mov.b64 %rd1116, {%r1236, %r1235}; | |
add.s64 %rd1117, %rd1116, %rd1029; | |
xor.b64 %rd1118, %rd1117, %rd1015; | |
mov.b64 {%r1237, %r1238}, %rd1118; | |
shr.u32 %r1239, %r1238, 24; | |
shl.b32 %r1240, %r1237, 8; | |
shr.u32 %r1241, %r1237, 24; | |
shl.b32 %r1242, %r1238, 8; | |
or.b32 %r1243, %r1239, %r1240; | |
or.b32 %r1244, %r1241, %r1242; | |
mov.b64 %rd1119, {%r1244, %r1243}; | |
ld.local.u64 %rd1120, [%rd82]; | |
add.s64 %rd1121, %rd1114, %rd1120; | |
add.s64 %rd1122, %rd1121, %rd1119; | |
xor.b64 %rd1123, %rd1122, %rd1116; | |
mov.b64 {%r1245, %r1246}, %rd1123; | |
shr.u32 %r1247, %r1246, 16; | |
shl.b32 %r1248, %r1245, 16; | |
shr.u32 %r1249, %r1245, 16; | |
shl.b32 %r1250, %r1246, 16; | |
or.b32 %r1251, %r1247, %r1248; | |
or.b32 %r1252, %r1249, %r1250; | |
mov.b64 %rd1124, {%r1252, %r1251}; | |
add.s64 %rd1125, %rd1124, %rd1117; | |
xor.b64 %rd1126, %rd1125, %rd1119; | |
mov.b64 {%r1253, %r1254}, %rd1126; | |
shr.u32 %r1255, %r1253, 31; | |
shl.b32 %r1256, %r1254, 1; | |
shr.u32 %r1257, %r1254, 31; | |
shl.b32 %r1258, %r1253, 1; | |
or.b32 %r1259, %r1255, %r1256; | |
or.b32 %r1260, %r1257, %r1258; | |
mov.b64 %rd1127, {%r1260, %r1259}; | |
ld.local.u64 %rd1128, [%rd83]; | |
add.s64 %rd1129, %rd1074, %rd1128; | |
add.s64 %rd1130, %rd1129, %rd1127; | |
xor.b64 %rd1131, %rd1130, %rd1092; | |
mov.b64 {%r1261, %r1262}, %rd1131; | |
mov.b64 %rd1132, {%r1262, %r1261}; | |
add.s64 %rd1133, %rd1132, %rd1109; | |
xor.b64 %rd1134, %rd1133, %rd1127; | |
mov.b64 {%r1263, %r1264}, %rd1134; | |
shr.u32 %r1265, %r1264, 24; | |
shl.b32 %r1266, %r1263, 8; | |
shr.u32 %r1267, %r1263, 24; | |
shl.b32 %r1268, %r1264, 8; | |
or.b32 %r1269, %r1265, %r1266; | |
or.b32 %r1270, %r1267, %r1268; | |
mov.b64 %rd1135, {%r1270, %r1269}; | |
ld.local.u64 %rd1136, [%rd84]; | |
add.s64 %rd1137, %rd1130, %rd1136; | |
add.s64 %rd1138, %rd1137, %rd1135; | |
xor.b64 %rd1139, %rd1138, %rd1132; | |
mov.b64 {%r1271, %r1272}, %rd1139; | |
shr.u32 %r1273, %r1272, 16; | |
shl.b32 %r1274, %r1271, 16; | |
shr.u32 %r1275, %r1271, 16; | |
shl.b32 %r1276, %r1272, 16; | |
or.b32 %r1277, %r1273, %r1274; | |
or.b32 %r1278, %r1275, %r1276; | |
mov.b64 %rd1140, {%r1278, %r1277}; | |
add.s64 %rd1141, %rd1140, %rd1133; | |
xor.b64 %rd1142, %rd1141, %rd1135; | |
mov.b64 {%r1279, %r1280}, %rd1142; | |
shr.u32 %r1281, %r1279, 31; | |
shl.b32 %r1282, %r1280, 1; | |
shr.u32 %r1283, %r1280, 31; | |
shl.b32 %r1284, %r1279, 1; | |
or.b32 %r1285, %r1281, %r1282; | |
or.b32 %r1286, %r1283, %r1284; | |
mov.b64 %rd1143, {%r1286, %r1285}; | |
ld.local.u64 %rd1144, [%rd85]; | |
add.s64 %rd1145, %rd1090, %rd1144; | |
add.s64 %rd1146, %rd1145, %rd1079; | |
xor.b64 %rd1147, %rd1146, %rd1108; | |
mov.b64 {%r1287, %r1288}, %rd1147; | |
mov.b64 %rd1148, {%r1288, %r1287}; | |
add.s64 %rd1149, %rd1148, %rd1125; | |
xor.b64 %rd1150, %rd1149, %rd1079; | |
mov.b64 {%r1289, %r1290}, %rd1150; | |
shr.u32 %r1291, %r1290, 24; | |
shl.b32 %r1292, %r1289, 8; | |
shr.u32 %r1293, %r1289, 24; | |
shl.b32 %r1294, %r1290, 8; | |
or.b32 %r1295, %r1291, %r1292; | |
or.b32 %r1296, %r1293, %r1294; | |
mov.b64 %rd1151, {%r1296, %r1295}; | |
ld.local.u64 %rd1152, [%rd86]; | |
add.s64 %rd1153, %rd1146, %rd1152; | |
add.s64 %rd1154, %rd1153, %rd1151; | |
xor.b64 %rd1155, %rd1154, %rd1148; | |
mov.b64 {%r1297, %r1298}, %rd1155; | |
shr.u32 %r1299, %r1298, 16; | |
shl.b32 %r1300, %r1297, 16; | |
shr.u32 %r1301, %r1297, 16; | |
shl.b32 %r1302, %r1298, 16; | |
or.b32 %r1303, %r1299, %r1300; | |
or.b32 %r1304, %r1301, %r1302; | |
mov.b64 %rd1156, {%r1304, %r1303}; | |
add.s64 %rd1157, %rd1156, %rd1149; | |
xor.b64 %rd1158, %rd1157, %rd1151; | |
mov.b64 {%r1305, %r1306}, %rd1158; | |
shr.u32 %r1307, %r1305, 31; | |
shl.b32 %r1308, %r1306, 1; | |
shr.u32 %r1309, %r1306, 31; | |
shl.b32 %r1310, %r1305, 1; | |
or.b32 %r1311, %r1307, %r1308; | |
or.b32 %r1312, %r1309, %r1310; | |
mov.b64 %rd1159, {%r1312, %r1311}; | |
ld.local.u64 %rd1160, [%rd87]; | |
add.s64 %rd1161, %rd1106, %rd1160; | |
add.s64 %rd1162, %rd1161, %rd1095; | |
xor.b64 %rd1163, %rd1162, %rd1124; | |
mov.b64 {%r1313, %r1314}, %rd1163; | |
mov.b64 %rd1164, {%r1314, %r1313}; | |
add.s64 %rd1165, %rd1164, %rd1077; | |
xor.b64 %rd1166, %rd1165, %rd1095; | |
mov.b64 {%r1315, %r1316}, %rd1166; | |
shr.u32 %r1317, %r1316, 24; | |
shl.b32 %r1318, %r1315, 8; | |
shr.u32 %r1319, %r1315, 24; | |
shl.b32 %r1320, %r1316, 8; | |
or.b32 %r1321, %r1317, %r1318; | |
or.b32 %r1322, %r1319, %r1320; | |
mov.b64 %rd1167, {%r1322, %r1321}; | |
ld.local.u64 %rd1168, [%rd88]; | |
add.s64 %rd1169, %rd1162, %rd1168; | |
add.s64 %rd1170, %rd1169, %rd1167; | |
xor.b64 %rd1171, %rd1170, %rd1164; | |
mov.b64 {%r1323, %r1324}, %rd1171; | |
shr.u32 %r1325, %r1324, 16; | |
shl.b32 %r1326, %r1323, 16; | |
shr.u32 %r1327, %r1323, 16; | |
shl.b32 %r1328, %r1324, 16; | |
or.b32 %r1329, %r1325, %r1326; | |
or.b32 %r1330, %r1327, %r1328; | |
mov.b64 %rd1172, {%r1330, %r1329}; | |
add.s64 %rd1173, %rd1172, %rd1165; | |
xor.b64 %rd1174, %rd1173, %rd1167; | |
mov.b64 {%r1331, %r1332}, %rd1174; | |
shr.u32 %r1333, %r1331, 31; | |
shl.b32 %r1334, %r1332, 1; | |
shr.u32 %r1335, %r1332, 31; | |
shl.b32 %r1336, %r1331, 1; | |
or.b32 %r1337, %r1333, %r1334; | |
or.b32 %r1338, %r1335, %r1336; | |
mov.b64 %rd1175, {%r1338, %r1337}; | |
ld.local.u64 %rd1176, [%rd89]; | |
add.s64 %rd1177, %rd1122, %rd1176; | |
add.s64 %rd1178, %rd1177, %rd1111; | |
xor.b64 %rd1179, %rd1178, %rd1076; | |
mov.b64 {%r1339, %r1340}, %rd1179; | |
mov.b64 %rd1180, {%r1340, %r1339}; | |
add.s64 %rd1181, %rd1180, %rd1093; | |
xor.b64 %rd1182, %rd1181, %rd1111; | |
mov.b64 {%r1341, %r1342}, %rd1182; | |
shr.u32 %r1343, %r1342, 24; | |
shl.b32 %r1344, %r1341, 8; | |
shr.u32 %r1345, %r1341, 24; | |
shl.b32 %r1346, %r1342, 8; | |
or.b32 %r1347, %r1343, %r1344; | |
or.b32 %r1348, %r1345, %r1346; | |
mov.b64 %rd1183, {%r1348, %r1347}; | |
ld.local.u64 %rd1184, [%rd90]; | |
add.s64 %rd1185, %rd1178, %rd1184; | |
add.s64 %rd1186, %rd1185, %rd1183; | |
xor.b64 %rd1187, %rd1186, %rd1180; | |
mov.b64 {%r1349, %r1350}, %rd1187; | |
shr.u32 %r1351, %r1350, 16; | |
shl.b32 %r1352, %r1349, 16; | |
shr.u32 %r1353, %r1349, 16; | |
shl.b32 %r1354, %r1350, 16; | |
or.b32 %r1355, %r1351, %r1352; | |
or.b32 %r1356, %r1353, %r1354; | |
mov.b64 %rd1188, {%r1356, %r1355}; | |
add.s64 %rd1189, %rd1188, %rd1181; | |
xor.b64 %rd1190, %rd1189, %rd1183; | |
mov.b64 {%r1357, %r1358}, %rd1190; | |
shr.u32 %r1359, %r1357, 31; | |
shl.b32 %r1360, %r1358, 1; | |
shr.u32 %r1361, %r1358, 31; | |
shl.b32 %r1362, %r1357, 1; | |
or.b32 %r1363, %r1359, %r1360; | |
or.b32 %r1364, %r1361, %r1362; | |
mov.b64 %rd1191, {%r1364, %r1363}; | |
ld.local.u64 %rd1192, [%rd91]; | |
add.s64 %rd1193, %rd1138, %rd1192; | |
add.s64 %rd1194, %rd1193, %rd1159; | |
xor.b64 %rd1195, %rd1194, %rd1188; | |
mov.b64 {%r1365, %r1366}, %rd1195; | |
mov.b64 %rd1196, {%r1366, %r1365}; | |
add.s64 %rd1197, %rd1196, %rd1173; | |
xor.b64 %rd1198, %rd1197, %rd1159; | |
mov.b64 {%r1367, %r1368}, %rd1198; | |
shr.u32 %r1369, %r1368, 24; | |
shl.b32 %r1370, %r1367, 8; | |
shr.u32 %r1371, %r1367, 24; | |
shl.b32 %r1372, %r1368, 8; | |
or.b32 %r1373, %r1369, %r1370; | |
or.b32 %r1374, %r1371, %r1372; | |
mov.b64 %rd1199, {%r1374, %r1373}; | |
ld.local.u64 %rd1200, [%rd92]; | |
add.s64 %rd1201, %rd1194, %rd1200; | |
add.s64 %rd1202, %rd1201, %rd1199; | |
xor.b64 %rd1203, %rd1202, %rd1196; | |
mov.b64 {%r1375, %r1376}, %rd1203; | |
shr.u32 %r1377, %r1376, 16; | |
shl.b32 %r1378, %r1375, 16; | |
shr.u32 %r1379, %r1375, 16; | |
shl.b32 %r1380, %r1376, 16; | |
or.b32 %r1381, %r1377, %r1378; | |
or.b32 %r1382, %r1379, %r1380; | |
mov.b64 %rd1204, {%r1382, %r1381}; | |
add.s64 %rd1205, %rd1204, %rd1197; | |
xor.b64 %rd1206, %rd1205, %rd1199; | |
mov.b64 {%r1383, %r1384}, %rd1206; | |
shr.u32 %r1385, %r1383, 31; | |
shl.b32 %r1386, %r1384, 1; | |
shr.u32 %r1387, %r1384, 31; | |
shl.b32 %r1388, %r1383, 1; | |
or.b32 %r1389, %r1385, %r1386; | |
or.b32 %r1390, %r1387, %r1388; | |
mov.b64 %rd1207, {%r1390, %r1389}; | |
ld.local.u64 %rd1208, [%rd93]; | |
add.s64 %rd1209, %rd1154, %rd1208; | |
add.s64 %rd1210, %rd1209, %rd1175; | |
xor.b64 %rd1211, %rd1210, %rd1140; | |
mov.b64 {%r1391, %r1392}, %rd1211; | |
mov.b64 %rd1212, {%r1392, %r1391}; | |
add.s64 %rd1213, %rd1212, %rd1189; | |
xor.b64 %rd1214, %rd1213, %rd1175; | |
mov.b64 {%r1393, %r1394}, %rd1214; | |
shr.u32 %r1395, %r1394, 24; | |
shl.b32 %r1396, %r1393, 8; | |
shr.u32 %r1397, %r1393, 24; | |
shl.b32 %r1398, %r1394, 8; | |
or.b32 %r1399, %r1395, %r1396; | |
or.b32 %r1400, %r1397, %r1398; | |
mov.b64 %rd1215, {%r1400, %r1399}; | |
ld.local.u64 %rd1216, [%rd94]; | |
add.s64 %rd1217, %rd1210, %rd1216; | |
add.s64 %rd1218, %rd1217, %rd1215; | |
xor.b64 %rd1219, %rd1218, %rd1212; | |
mov.b64 {%r1401, %r1402}, %rd1219; | |
shr.u32 %r1403, %r1402, 16; | |
shl.b32 %r1404, %r1401, 16; | |
shr.u32 %r1405, %r1401, 16; | |
shl.b32 %r1406, %r1402, 16; | |
or.b32 %r1407, %r1403, %r1404; | |
or.b32 %r1408, %r1405, %r1406; | |
mov.b64 %rd1220, {%r1408, %r1407}; | |
add.s64 %rd1221, %rd1220, %rd1213; | |
xor.b64 %rd1222, %rd1221, %rd1215; | |
mov.b64 {%r1409, %r1410}, %rd1222; | |
shr.u32 %r1411, %r1409, 31; | |
shl.b32 %r1412, %r1410, 1; | |
shr.u32 %r1413, %r1410, 31; | |
shl.b32 %r1414, %r1409, 1; | |
or.b32 %r1415, %r1411, %r1412; | |
or.b32 %r1416, %r1413, %r1414; | |
mov.b64 %rd1223, {%r1416, %r1415}; | |
ld.local.u64 %rd1224, [%rd95]; | |
add.s64 %rd1225, %rd1170, %rd1224; | |
add.s64 %rd1226, %rd1225, %rd1191; | |
xor.b64 %rd1227, %rd1226, %rd1156; | |
mov.b64 {%r1417, %r1418}, %rd1227; | |
mov.b64 %rd1228, {%r1418, %r1417}; | |
add.s64 %rd1229, %rd1228, %rd1141; | |
xor.b64 %rd1230, %rd1229, %rd1191; | |
mov.b64 {%r1419, %r1420}, %rd1230; | |
shr.u32 %r1421, %r1420, 24; | |
shl.b32 %r1422, %r1419, 8; | |
shr.u32 %r1423, %r1419, 24; | |
shl.b32 %r1424, %r1420, 8; | |
or.b32 %r1425, %r1421, %r1422; | |
or.b32 %r1426, %r1423, %r1424; | |
mov.b64 %rd1231, {%r1426, %r1425}; | |
ld.local.u64 %rd1232, [%rd96]; | |
add.s64 %rd1233, %rd1226, %rd1232; | |
add.s64 %rd1234, %rd1233, %rd1231; | |
xor.b64 %rd1235, %rd1234, %rd1228; | |
mov.b64 {%r1427, %r1428}, %rd1235; | |
shr.u32 %r1429, %r1428, 16; | |
shl.b32 %r1430, %r1427, 16; | |
shr.u32 %r1431, %r1427, 16; | |
shl.b32 %r1432, %r1428, 16; | |
or.b32 %r1433, %r1429, %r1430; | |
or.b32 %r1434, %r1431, %r1432; | |
mov.b64 %rd1236, {%r1434, %r1433}; | |
add.s64 %rd1237, %rd1236, %rd1229; | |
xor.b64 %rd1238, %rd1237, %rd1231; | |
mov.b64 {%r1435, %r1436}, %rd1238; | |
shr.u32 %r1437, %r1435, 31; | |
shl.b32 %r1438, %r1436, 1; | |
shr.u32 %r1439, %r1436, 31; | |
shl.b32 %r1440, %r1435, 1; | |
or.b32 %r1441, %r1437, %r1438; | |
or.b32 %r1442, %r1439, %r1440; | |
mov.b64 %rd1239, {%r1442, %r1441}; | |
ld.local.u64 %rd1240, [%rd97]; | |
add.s64 %rd1241, %rd1186, %rd1240; | |
add.s64 %rd1242, %rd1241, %rd1143; | |
xor.b64 %rd1243, %rd1242, %rd1172; | |
mov.b64 {%r1443, %r1444}, %rd1243; | |
mov.b64 %rd1244, {%r1444, %r1443}; | |
add.s64 %rd1245, %rd1244, %rd1157; | |
xor.b64 %rd1246, %rd1245, %rd1143; | |
mov.b64 {%r1445, %r1446}, %rd1246; | |
shr.u32 %r1447, %r1446, 24; | |
shl.b32 %r1448, %r1445, 8; | |
shr.u32 %r1449, %r1445, 24; | |
shl.b32 %r1450, %r1446, 8; | |
or.b32 %r1451, %r1447, %r1448; | |
or.b32 %r1452, %r1449, %r1450; | |
mov.b64 %rd1247, {%r1452, %r1451}; | |
ld.local.u64 %rd1248, [%rd98]; | |
add.s64 %rd1249, %rd1242, %rd1248; | |
add.s64 %rd1250, %rd1249, %rd1247; | |
xor.b64 %rd1251, %rd1250, %rd1244; | |
mov.b64 {%r1453, %r1454}, %rd1251; | |
shr.u32 %r1455, %r1454, 16; | |
shl.b32 %r1456, %r1453, 16; | |
shr.u32 %r1457, %r1453, 16; | |
shl.b32 %r1458, %r1454, 16; | |
or.b32 %r1459, %r1455, %r1456; | |
or.b32 %r1460, %r1457, %r1458; | |
mov.b64 %rd1252, {%r1460, %r1459}; | |
add.s64 %rd1253, %rd1252, %rd1245; | |
xor.b64 %rd1254, %rd1253, %rd1247; | |
mov.b64 {%r1461, %r1462}, %rd1254; | |
shr.u32 %r1463, %r1461, 31; | |
shl.b32 %r1464, %r1462, 1; | |
shr.u32 %r1465, %r1462, 31; | |
shl.b32 %r1466, %r1461, 1; | |
or.b32 %r1467, %r1463, %r1464; | |
or.b32 %r1468, %r1465, %r1466; | |
mov.b64 %rd1255, {%r1468, %r1467}; | |
ld.local.u64 %rd1256, [%rd99]; | |
add.s64 %rd1257, %rd1202, %rd1256; | |
add.s64 %rd1258, %rd1257, %rd1255; | |
xor.b64 %rd1259, %rd1258, %rd1220; | |
mov.b64 {%r1469, %r1470}, %rd1259; | |
mov.b64 %rd1260, {%r1470, %r1469}; | |
add.s64 %rd1261, %rd1260, %rd1237; | |
xor.b64 %rd1262, %rd1261, %rd1255; | |
mov.b64 {%r1471, %r1472}, %rd1262; | |
shr.u32 %r1473, %r1472, 24; | |
shl.b32 %r1474, %r1471, 8; | |
shr.u32 %r1475, %r1471, 24; | |
shl.b32 %r1476, %r1472, 8; | |
or.b32 %r1477, %r1473, %r1474; | |
or.b32 %r1478, %r1475, %r1476; | |
mov.b64 %rd1263, {%r1478, %r1477}; | |
ld.local.u64 %rd1264, [%rd100]; | |
add.s64 %rd1265, %rd1258, %rd1264; | |
add.s64 %rd1266, %rd1265, %rd1263; | |
xor.b64 %rd1267, %rd1266, %rd1260; | |
mov.b64 {%r1479, %r1480}, %rd1267; | |
shr.u32 %r1481, %r1480, 16; | |
shl.b32 %r1482, %r1479, 16; | |
shr.u32 %r1483, %r1479, 16; | |
shl.b32 %r1484, %r1480, 16; | |
or.b32 %r1485, %r1481, %r1482; | |
or.b32 %r1486, %r1483, %r1484; | |
mov.b64 %rd1268, {%r1486, %r1485}; | |
add.s64 %rd1269, %rd1268, %rd1261; | |
xor.b64 %rd1270, %rd1269, %rd1263; | |
mov.b64 {%r1487, %r1488}, %rd1270; | |
shr.u32 %r1489, %r1487, 31; | |
shl.b32 %r1490, %r1488, 1; | |
shr.u32 %r1491, %r1488, 31; | |
shl.b32 %r1492, %r1487, 1; | |
or.b32 %r1493, %r1489, %r1490; | |
or.b32 %r1494, %r1491, %r1492; | |
mov.b64 %rd1271, {%r1494, %r1493}; | |
ld.local.u64 %rd1272, [%rd101]; | |
add.s64 %rd1273, %rd1218, %rd1272; | |
add.s64 %rd1274, %rd1273, %rd1207; | |
xor.b64 %rd1275, %rd1274, %rd1236; | |
mov.b64 {%r1495, %r1496}, %rd1275; | |
mov.b64 %rd1276, {%r1496, %r1495}; | |
add.s64 %rd1277, %rd1276, %rd1253; | |
xor.b64 %rd1278, %rd1277, %rd1207; | |
mov.b64 {%r1497, %r1498}, %rd1278; | |
shr.u32 %r1499, %r1498, 24; | |
shl.b32 %r1500, %r1497, 8; | |
shr.u32 %r1501, %r1497, 24; | |
shl.b32 %r1502, %r1498, 8; | |
or.b32 %r1503, %r1499, %r1500; | |
or.b32 %r1504, %r1501, %r1502; | |
mov.b64 %rd1279, {%r1504, %r1503}; | |
ld.local.u64 %rd1280, [%rd102]; | |
add.s64 %rd1281, %rd1274, %rd1280; | |
add.s64 %rd1282, %rd1281, %rd1279; | |
xor.b64 %rd1283, %rd1282, %rd1276; | |
mov.b64 {%r1505, %r1506}, %rd1283; | |
shr.u32 %r1507, %r1506, 16; | |
shl.b32 %r1508, %r1505, 16; | |
shr.u32 %r1509, %r1505, 16; | |
shl.b32 %r1510, %r1506, 16; | |
or.b32 %r1511, %r1507, %r1508; | |
or.b32 %r1512, %r1509, %r1510; | |
mov.b64 %rd1284, {%r1512, %r1511}; | |
add.s64 %rd1285, %rd1284, %rd1277; | |
xor.b64 %rd1286, %rd1285, %rd1279; | |
mov.b64 {%r1513, %r1514}, %rd1286; | |
shr.u32 %r1515, %r1513, 31; | |
shl.b32 %r1516, %r1514, 1; | |
shr.u32 %r1517, %r1514, 31; | |
shl.b32 %r1518, %r1513, 1; | |
or.b32 %r1519, %r1515, %r1516; | |
or.b32 %r1520, %r1517, %r1518; | |
mov.b64 %rd1287, {%r1520, %r1519}; | |
ld.local.u64 %rd1288, [%rd103]; | |
add.s64 %rd1289, %rd1234, %rd1288; | |
add.s64 %rd1290, %rd1289, %rd1223; | |
xor.b64 %rd1291, %rd1290, %rd1252; | |
mov.b64 {%r1521, %r1522}, %rd1291; | |
mov.b64 %rd1292, {%r1522, %r1521}; | |
add.s64 %rd1293, %rd1292, %rd1205; | |
xor.b64 %rd1294, %rd1293, %rd1223; | |
mov.b64 {%r1523, %r1524}, %rd1294; | |
shr.u32 %r1525, %r1524, 24; | |
shl.b32 %r1526, %r1523, 8; | |
shr.u32 %r1527, %r1523, 24; | |
shl.b32 %r1528, %r1524, 8; | |
or.b32 %r1529, %r1525, %r1526; | |
or.b32 %r1530, %r1527, %r1528; | |
mov.b64 %rd1295, {%r1530, %r1529}; | |
ld.local.u64 %rd1296, [%rd104]; | |
add.s64 %rd1297, %rd1290, %rd1296; | |
add.s64 %rd1298, %rd1297, %rd1295; | |
xor.b64 %rd1299, %rd1298, %rd1292; | |
mov.b64 {%r1531, %r1532}, %rd1299; | |
shr.u32 %r1533, %r1532, 16; | |
shl.b32 %r1534, %r1531, 16; | |
shr.u32 %r1535, %r1531, 16; | |
shl.b32 %r1536, %r1532, 16; | |
or.b32 %r1537, %r1533, %r1534; | |
or.b32 %r1538, %r1535, %r1536; | |
mov.b64 %rd1300, {%r1538, %r1537}; | |
add.s64 %rd1301, %rd1300, %rd1293; | |
xor.b64 %rd1302, %rd1301, %rd1295; | |
mov.b64 {%r1539, %r1540}, %rd1302; | |
shr.u32 %r1541, %r1539, 31; | |
shl.b32 %r1542, %r1540, 1; | |
shr.u32 %r1543, %r1540, 31; | |
shl.b32 %r1544, %r1539, 1; | |
or.b32 %r1545, %r1541, %r1542; | |
or.b32 %r1546, %r1543, %r1544; | |
mov.b64 %rd1303, {%r1546, %r1545}; | |
ld.local.u64 %rd1304, [%rd105]; | |
add.s64 %rd1305, %rd1250, %rd1304; | |
add.s64 %rd1306, %rd1305, %rd1239; | |
xor.b64 %rd1307, %rd1306, %rd1204; | |
mov.b64 {%r1547, %r1548}, %rd1307; | |
mov.b64 %rd1308, {%r1548, %r1547}; | |
add.s64 %rd1309, %rd1308, %rd1221; | |
xor.b64 %rd1310, %rd1309, %rd1239; | |
mov.b64 {%r1549, %r1550}, %rd1310; | |
shr.u32 %r1551, %r1550, 24; | |
shl.b32 %r1552, %r1549, 8; | |
shr.u32 %r1553, %r1549, 24; | |
shl.b32 %r1554, %r1550, 8; | |
or.b32 %r1555, %r1551, %r1552; | |
or.b32 %r1556, %r1553, %r1554; | |
mov.b64 %rd1311, {%r1556, %r1555}; | |
ld.local.u64 %rd1312, [%rd106]; | |
add.s64 %rd1313, %rd1306, %rd1312; | |
add.s64 %rd1314, %rd1313, %rd1311; | |
xor.b64 %rd1315, %rd1314, %rd1308; | |
mov.b64 {%r1557, %r1558}, %rd1315; | |
shr.u32 %r1559, %r1558, 16; | |
shl.b32 %r1560, %r1557, 16; | |
shr.u32 %r1561, %r1557, 16; | |
shl.b32 %r1562, %r1558, 16; | |
or.b32 %r1563, %r1559, %r1560; | |
or.b32 %r1564, %r1561, %r1562; | |
mov.b64 %rd1316, {%r1564, %r1563}; | |
add.s64 %rd1317, %rd1316, %rd1309; | |
xor.b64 %rd1318, %rd1317, %rd1311; | |
mov.b64 {%r1565, %r1566}, %rd1318; | |
shr.u32 %r1567, %r1565, 31; | |
shl.b32 %r1568, %r1566, 1; | |
shr.u32 %r1569, %r1566, 31; | |
shl.b32 %r1570, %r1565, 1; | |
or.b32 %r1571, %r1567, %r1568; | |
or.b32 %r1572, %r1569, %r1570; | |
mov.b64 %rd1319, {%r1572, %r1571}; | |
ld.local.u64 %rd1320, [%rd107]; | |
add.s64 %rd1321, %rd1266, %rd1320; | |
add.s64 %rd1322, %rd1321, %rd1287; | |
xor.b64 %rd1323, %rd1322, %rd1316; | |
mov.b64 {%r1573, %r1574}, %rd1323; | |
mov.b64 %rd1324, {%r1574, %r1573}; | |
add.s64 %rd1325, %rd1324, %rd1301; | |
xor.b64 %rd1326, %rd1325, %rd1287; | |
mov.b64 {%r1575, %r1576}, %rd1326; | |
shr.u32 %r1577, %r1576, 24; | |
shl.b32 %r1578, %r1575, 8; | |
shr.u32 %r1579, %r1575, 24; | |
shl.b32 %r1580, %r1576, 8; | |
or.b32 %r1581, %r1577, %r1578; | |
or.b32 %r1582, %r1579, %r1580; | |
mov.b64 %rd1327, {%r1582, %r1581}; | |
ld.local.u64 %rd1328, [%rd108]; | |
add.s64 %rd1329, %rd1322, %rd1328; | |
add.s64 %rd1330, %rd1329, %rd1327; | |
xor.b64 %rd1331, %rd1330, %rd1324; | |
mov.b64 {%r1583, %r1584}, %rd1331; | |
shr.u32 %r1585, %r1584, 16; | |
shl.b32 %r1586, %r1583, 16; | |
shr.u32 %r1587, %r1583, 16; | |
shl.b32 %r1588, %r1584, 16; | |
or.b32 %r1589, %r1585, %r1586; | |
or.b32 %r1590, %r1587, %r1588; | |
mov.b64 %rd1332, {%r1590, %r1589}; | |
add.s64 %rd1333, %rd1332, %rd1325; | |
xor.b64 %rd1334, %rd1333, %rd1327; | |
mov.b64 {%r1591, %r1592}, %rd1334; | |
shr.u32 %r1593, %r1591, 31; | |
shl.b32 %r1594, %r1592, 1; | |
shr.u32 %r1595, %r1592, 31; | |
shl.b32 %r1596, %r1591, 1; | |
or.b32 %r1597, %r1593, %r1594; | |
or.b32 %r1598, %r1595, %r1596; | |
mov.b64 %rd1335, {%r1598, %r1597}; | |
ld.local.u64 %rd1336, [%rd109]; | |
add.s64 %rd1337, %rd1282, %rd1336; | |
add.s64 %rd1338, %rd1337, %rd1303; | |
xor.b64 %rd1339, %rd1338, %rd1268; | |
mov.b64 {%r1599, %r1600}, %rd1339; | |
mov.b64 %rd1340, {%r1600, %r1599}; | |
add.s64 %rd1341, %rd1340, %rd1317; | |
xor.b64 %rd1342, %rd1341, %rd1303; | |
mov.b64 {%r1601, %r1602}, %rd1342; | |
shr.u32 %r1603, %r1602, 24; | |
shl.b32 %r1604, %r1601, 8; | |
shr.u32 %r1605, %r1601, 24; | |
shl.b32 %r1606, %r1602, 8; | |
or.b32 %r1607, %r1603, %r1604; | |
or.b32 %r1608, %r1605, %r1606; | |
mov.b64 %rd1343, {%r1608, %r1607}; | |
ld.local.u64 %rd1344, [%rd110]; | |
add.s64 %rd1345, %rd1338, %rd1344; | |
add.s64 %rd1346, %rd1345, %rd1343; | |
xor.b64 %rd1347, %rd1346, %rd1340; | |
mov.b64 {%r1609, %r1610}, %rd1347; | |
shr.u32 %r1611, %r1610, 16; | |
shl.b32 %r1612, %r1609, 16; | |
shr.u32 %r1613, %r1609, 16; | |
shl.b32 %r1614, %r1610, 16; | |
or.b32 %r1615, %r1611, %r1612; | |
or.b32 %r1616, %r1613, %r1614; | |
mov.b64 %rd1348, {%r1616, %r1615}; | |
add.s64 %rd1349, %rd1348, %rd1341; | |
xor.b64 %rd1350, %rd1349, %rd1343; | |
mov.b64 {%r1617, %r1618}, %rd1350; | |
shr.u32 %r1619, %r1617, 31; | |
shl.b32 %r1620, %r1618, 1; | |
shr.u32 %r1621, %r1618, 31; | |
shl.b32 %r1622, %r1617, 1; | |
or.b32 %r1623, %r1619, %r1620; | |
or.b32 %r1624, %r1621, %r1622; | |
mov.b64 %rd1351, {%r1624, %r1623}; | |
ld.local.u64 %rd1352, [%rd111]; | |
add.s64 %rd1353, %rd1298, %rd1352; | |
add.s64 %rd1354, %rd1353, %rd1319; | |
xor.b64 %rd1355, %rd1354, %rd1284; | |
mov.b64 {%r1625, %r1626}, %rd1355; | |
mov.b64 %rd1356, {%r1626, %r1625}; | |
add.s64 %rd1357, %rd1356, %rd1269; | |
xor.b64 %rd1358, %rd1357, %rd1319; | |
mov.b64 {%r1627, %r1628}, %rd1358; | |
shr.u32 %r1629, %r1628, 24; | |
shl.b32 %r1630, %r1627, 8; | |
shr.u32 %r1631, %r1627, 24; | |
shl.b32 %r1632, %r1628, 8; | |
or.b32 %r1633, %r1629, %r1630; | |
or.b32 %r1634, %r1631, %r1632; | |
mov.b64 %rd1359, {%r1634, %r1633}; | |
ld.local.u64 %rd1360, [%rd112]; | |
add.s64 %rd1361, %rd1354, %rd1360; | |
add.s64 %rd1362, %rd1361, %rd1359; | |
xor.b64 %rd1363, %rd1362, %rd1356; | |
mov.b64 {%r1635, %r1636}, %rd1363; | |
shr.u32 %r1637, %r1636, 16; | |
shl.b32 %r1638, %r1635, 16; | |
shr.u32 %r1639, %r1635, 16; | |
shl.b32 %r1640, %r1636, 16; | |
or.b32 %r1641, %r1637, %r1638; | |
or.b32 %r1642, %r1639, %r1640; | |
mov.b64 %rd1364, {%r1642, %r1641}; | |
add.s64 %rd1365, %rd1364, %rd1357; | |
xor.b64 %rd1366, %rd1365, %rd1359; | |
mov.b64 {%r1643, %r1644}, %rd1366; | |
shr.u32 %r1645, %r1643, 31; | |
shl.b32 %r1646, %r1644, 1; | |
shr.u32 %r1647, %r1644, 31; | |
shl.b32 %r1648, %r1643, 1; | |
or.b32 %r1649, %r1645, %r1646; | |
or.b32 %r1650, %r1647, %r1648; | |
mov.b64 %rd1367, {%r1650, %r1649}; | |
ld.local.u64 %rd1368, [%rd113]; | |
add.s64 %rd1369, %rd1314, %rd1368; | |
add.s64 %rd1370, %rd1369, %rd1271; | |
xor.b64 %rd1371, %rd1370, %rd1300; | |
mov.b64 {%r1651, %r1652}, %rd1371; | |
mov.b64 %rd1372, {%r1652, %r1651}; | |
add.s64 %rd1373, %rd1372, %rd1285; | |
xor.b64 %rd1374, %rd1373, %rd1271; | |
mov.b64 {%r1653, %r1654}, %rd1374; | |
shr.u32 %r1655, %r1654, 24; | |
shl.b32 %r1656, %r1653, 8; | |
shr.u32 %r1657, %r1653, 24; | |
shl.b32 %r1658, %r1654, 8; | |
or.b32 %r1659, %r1655, %r1656; | |
or.b32 %r1660, %r1657, %r1658; | |
mov.b64 %rd1375, {%r1660, %r1659}; | |
ld.local.u64 %rd1376, [%rd114]; | |
add.s64 %rd1377, %rd1370, %rd1376; | |
add.s64 %rd1378, %rd1377, %rd1375; | |
xor.b64 %rd1379, %rd1378, %rd1372; | |
mov.b64 {%r1661, %r1662}, %rd1379; | |
shr.u32 %r1663, %r1662, 16; | |
shl.b32 %r1664, %r1661, 16; | |
shr.u32 %r1665, %r1661, 16; | |
shl.b32 %r1666, %r1662, 16; | |
or.b32 %r1667, %r1663, %r1664; | |
or.b32 %r1668, %r1665, %r1666; | |
mov.b64 %rd1380, {%r1668, %r1667}; | |
add.s64 %rd1381, %rd1380, %rd1373; | |
xor.b64 %rd1382, %rd1381, %rd1375; | |
mov.b64 {%r1669, %r1670}, %rd1382; | |
shr.u32 %r1671, %r1669, 31; | |
shl.b32 %r1672, %r1670, 1; | |
shr.u32 %r1673, %r1670, 31; | |
shl.b32 %r1674, %r1669, 1; | |
or.b32 %r1675, %r1671, %r1672; | |
or.b32 %r1676, %r1673, %r1674; | |
mov.b64 %rd1383, {%r1676, %r1675}; | |
ld.local.u64 %rd1384, [%rd115]; | |
add.s64 %rd1385, %rd1330, %rd1384; | |
add.s64 %rd1386, %rd1385, %rd1383; | |
xor.b64 %rd1387, %rd1386, %rd1348; | |
mov.b64 {%r1677, %r1678}, %rd1387; | |
mov.b64 %rd1388, {%r1678, %r1677}; | |
add.s64 %rd1389, %rd1388, %rd1365; | |
xor.b64 %rd1390, %rd1389, %rd1383; | |
mov.b64 {%r1679, %r1680}, %rd1390; | |
shr.u32 %r1681, %r1680, 24; | |
shl.b32 %r1682, %r1679, 8; | |
shr.u32 %r1683, %r1679, 24; | |
shl.b32 %r1684, %r1680, 8; | |
or.b32 %r1685, %r1681, %r1682; | |
or.b32 %r1686, %r1683, %r1684; | |
mov.b64 %rd1391, {%r1686, %r1685}; | |
ld.local.u64 %rd1392, [%rd116]; | |
add.s64 %rd1393, %rd1386, %rd1392; | |
add.s64 %rd1394, %rd1393, %rd1391; | |
xor.b64 %rd1395, %rd1394, %rd1388; | |
mov.b64 {%r1687, %r1688}, %rd1395; | |
shr.u32 %r1689, %r1688, 16; | |
shl.b32 %r1690, %r1687, 16; | |
shr.u32 %r1691, %r1687, 16; | |
shl.b32 %r1692, %r1688, 16; | |
or.b32 %r1693, %r1689, %r1690; | |
or.b32 %r1694, %r1691, %r1692; | |
mov.b64 %rd1396, {%r1694, %r1693}; | |
add.s64 %rd1397, %rd1396, %rd1389; | |
xor.b64 %rd1398, %rd1397, %rd1391; | |
mov.b64 {%r1695, %r1696}, %rd1398; | |
shr.u32 %r1697, %r1695, 31; | |
shl.b32 %r1698, %r1696, 1; | |
shr.u32 %r1699, %r1696, 31; | |
shl.b32 %r1700, %r1695, 1; | |
or.b32 %r1701, %r1697, %r1698; | |
or.b32 %r1702, %r1699, %r1700; | |
mov.b64 %rd1399, {%r1702, %r1701}; | |
ld.local.u64 %rd1400, [%rd117]; | |
add.s64 %rd1401, %rd1346, %rd1400; | |
add.s64 %rd1402, %rd1401, %rd1335; | |
xor.b64 %rd1403, %rd1402, %rd1364; | |
mov.b64 {%r1703, %r1704}, %rd1403; | |
mov.b64 %rd1404, {%r1704, %r1703}; | |
add.s64 %rd1405, %rd1404, %rd1381; | |
xor.b64 %rd1406, %rd1405, %rd1335; | |
mov.b64 {%r1705, %r1706}, %rd1406; | |
shr.u32 %r1707, %r1706, 24; | |
shl.b32 %r1708, %r1705, 8; | |
shr.u32 %r1709, %r1705, 24; | |
shl.b32 %r1710, %r1706, 8; | |
or.b32 %r1711, %r1707, %r1708; | |
or.b32 %r1712, %r1709, %r1710; | |
mov.b64 %rd1407, {%r1712, %r1711}; | |
ld.local.u64 %rd1408, [%rd118]; | |
add.s64 %rd1409, %rd1402, %rd1408; | |
add.s64 %rd1410, %rd1409, %rd1407; | |
xor.b64 %rd1411, %rd1410, %rd1404; | |
mov.b64 {%r1713, %r1714}, %rd1411; | |
shr.u32 %r1715, %r1714, 16; | |
shl.b32 %r1716, %r1713, 16; | |
shr.u32 %r1717, %r1713, 16; | |
shl.b32 %r1718, %r1714, 16; | |
or.b32 %r1719, %r1715, %r1716; | |
or.b32 %r1720, %r1717, %r1718; | |
mov.b64 %rd1412, {%r1720, %r1719}; | |
add.s64 %rd1413, %rd1412, %rd1405; | |
xor.b64 %rd1414, %rd1413, %rd1407; | |
mov.b64 {%r1721, %r1722}, %rd1414; | |
shr.u32 %r1723, %r1721, 31; | |
shl.b32 %r1724, %r1722, 1; | |
shr.u32 %r1725, %r1722, 31; | |
shl.b32 %r1726, %r1721, 1; | |
or.b32 %r1727, %r1723, %r1724; | |
or.b32 %r1728, %r1725, %r1726; | |
mov.b64 %rd1415, {%r1728, %r1727}; | |
ld.local.u64 %rd1416, [%rd119]; | |
add.s64 %rd1417, %rd1362, %rd1416; | |
add.s64 %rd1418, %rd1417, %rd1351; | |
xor.b64 %rd1419, %rd1418, %rd1380; | |
mov.b64 {%r1729, %r1730}, %rd1419; | |
mov.b64 %rd1420, {%r1730, %r1729}; | |
add.s64 %rd1421, %rd1420, %rd1333; | |
xor.b64 %rd1422, %rd1421, %rd1351; | |
mov.b64 {%r1731, %r1732}, %rd1422; | |
shr.u32 %r1733, %r1732, 24; | |
shl.b32 %r1734, %r1731, 8; | |
shr.u32 %r1735, %r1731, 24; | |
shl.b32 %r1736, %r1732, 8; | |
or.b32 %r1737, %r1733, %r1734; | |
or.b32 %r1738, %r1735, %r1736; | |
mov.b64 %rd1423, {%r1738, %r1737}; | |
ld.local.u64 %rd1424, [%rd120]; | |
add.s64 %rd1425, %rd1418, %rd1424; | |
add.s64 %rd1426, %rd1425, %rd1423; | |
xor.b64 %rd1427, %rd1426, %rd1420; | |
mov.b64 {%r1739, %r1740}, %rd1427; | |
shr.u32 %r1741, %r1740, 16; | |
shl.b32 %r1742, %r1739, 16; | |
shr.u32 %r1743, %r1739, 16; | |
shl.b32 %r1744, %r1740, 16; | |
or.b32 %r1745, %r1741, %r1742; | |
or.b32 %r1746, %r1743, %r1744; | |
mov.b64 %rd1428, {%r1746, %r1745}; | |
add.s64 %rd1429, %rd1428, %rd1421; | |
xor.b64 %rd1430, %rd1429, %rd1423; | |
mov.b64 {%r1747, %r1748}, %rd1430; | |
shr.u32 %r1749, %r1747, 31; | |
shl.b32 %r1750, %r1748, 1; | |
shr.u32 %r1751, %r1748, 31; | |
shl.b32 %r1752, %r1747, 1; | |
or.b32 %r1753, %r1749, %r1750; | |
or.b32 %r1754, %r1751, %r1752; | |
mov.b64 %rd1431, {%r1754, %r1753}; | |
ld.local.u64 %rd1432, [%rd121]; | |
add.s64 %rd1433, %rd1378, %rd1432; | |
add.s64 %rd1434, %rd1433, %rd1367; | |
xor.b64 %rd1435, %rd1434, %rd1332; | |
mov.b64 {%r1755, %r1756}, %rd1435; | |
mov.b64 %rd1436, {%r1756, %r1755}; | |
add.s64 %rd1437, %rd1436, %rd1349; | |
xor.b64 %rd1438, %rd1437, %rd1367; | |
mov.b64 {%r1757, %r1758}, %rd1438; | |
shr.u32 %r1759, %r1758, 24; | |
shl.b32 %r1760, %r1757, 8; | |
shr.u32 %r1761, %r1757, 24; | |
shl.b32 %r1762, %r1758, 8; | |
or.b32 %r1763, %r1759, %r1760; | |
or.b32 %r1764, %r1761, %r1762; | |
mov.b64 %rd1439, {%r1764, %r1763}; | |
ld.local.u64 %rd1440, [%rd122]; | |
add.s64 %rd1441, %rd1434, %rd1440; | |
add.s64 %rd1442, %rd1441, %rd1439; | |
xor.b64 %rd1443, %rd1442, %rd1436; | |
mov.b64 {%r1765, %r1766}, %rd1443; | |
shr.u32 %r1767, %r1766, 16; | |
shl.b32 %r1768, %r1765, 16; | |
shr.u32 %r1769, %r1765, 16; | |
shl.b32 %r1770, %r1766, 16; | |
or.b32 %r1771, %r1767, %r1768; | |
or.b32 %r1772, %r1769, %r1770; | |
mov.b64 %rd1444, {%r1772, %r1771}; | |
add.s64 %rd1445, %rd1444, %rd1437; | |
xor.b64 %rd1446, %rd1445, %rd1439; | |
mov.b64 {%r1773, %r1774}, %rd1446; | |
shr.u32 %r1775, %r1773, 31; | |
shl.b32 %r1776, %r1774, 1; | |
shr.u32 %r1777, %r1774, 31; | |
shl.b32 %r1778, %r1773, 1; | |
or.b32 %r1779, %r1775, %r1776; | |
or.b32 %r1780, %r1777, %r1778; | |
mov.b64 %rd1447, {%r1780, %r1779}; | |
ld.local.u64 %rd1448, [%rd123]; | |
add.s64 %rd1449, %rd1394, %rd1448; | |
add.s64 %rd1450, %rd1449, %rd1415; | |
xor.b64 %rd1451, %rd1450, %rd1444; | |
mov.b64 {%r1781, %r1782}, %rd1451; | |
mov.b64 %rd1452, {%r1782, %r1781}; | |
add.s64 %rd1453, %rd1452, %rd1429; | |
xor.b64 %rd1454, %rd1453, %rd1415; | |
mov.b64 {%r1783, %r1784}, %rd1454; | |
shr.u32 %r1785, %r1784, 24; | |
shl.b32 %r1786, %r1783, 8; | |
shr.u32 %r1787, %r1783, 24; | |
shl.b32 %r1788, %r1784, 8; | |
or.b32 %r1789, %r1785, %r1786; | |
or.b32 %r1790, %r1787, %r1788; | |
mov.b64 %rd1455, {%r1790, %r1789}; | |
ld.local.u64 %rd1456, [%rd124]; | |
add.s64 %rd1457, %rd1450, %rd1456; | |
add.s64 %rd1458, %rd1457, %rd1455; | |
xor.b64 %rd1459, %rd1458, %rd1452; | |
mov.b64 {%r1791, %r1792}, %rd1459; | |
shr.u32 %r1793, %r1792, 16; | |
shl.b32 %r1794, %r1791, 16; | |
shr.u32 %r1795, %r1791, 16; | |
shl.b32 %r1796, %r1792, 16; | |
or.b32 %r1797, %r1793, %r1794; | |
or.b32 %r1798, %r1795, %r1796; | |
mov.b64 %rd1460, {%r1798, %r1797}; | |
add.s64 %rd1461, %rd1460, %rd1453; | |
xor.b64 %rd1462, %rd1461, %rd1455; | |
mov.b64 {%r1799, %r1800}, %rd1462; | |
shr.u32 %r1801, %r1799, 31; | |
shl.b32 %r1802, %r1800, 1; | |
shr.u32 %r1803, %r1800, 31; | |
shl.b32 %r1804, %r1799, 1; | |
or.b32 %r1805, %r1801, %r1802; | |
or.b32 %r1806, %r1803, %r1804; | |
mov.b64 %rd1463, {%r1806, %r1805}; | |
ld.local.u64 %rd1464, [%rd125]; | |
add.s64 %rd1465, %rd1410, %rd1464; | |
add.s64 %rd1466, %rd1465, %rd1431; | |
xor.b64 %rd1467, %rd1466, %rd1396; | |
mov.b64 {%r1807, %r1808}, %rd1467; | |
mov.b64 %rd1468, {%r1808, %r1807}; | |
add.s64 %rd1469, %rd1468, %rd1445; | |
xor.b64 %rd1470, %rd1469, %rd1431; | |
mov.b64 {%r1809, %r1810}, %rd1470; | |
shr.u32 %r1811, %r1810, 24; | |
shl.b32 %r1812, %r1809, 8; | |
shr.u32 %r1813, %r1809, 24; | |
shl.b32 %r1814, %r1810, 8; | |
or.b32 %r1815, %r1811, %r1812; | |
or.b32 %r1816, %r1813, %r1814; | |
mov.b64 %rd1471, {%r1816, %r1815}; | |
ld.local.u64 %rd1472, [%rd126]; | |
add.s64 %rd1473, %rd1466, %rd1472; | |
add.s64 %rd1474, %rd1473, %rd1471; | |
xor.b64 %rd1475, %rd1474, %rd1468; | |
mov.b64 {%r1817, %r1818}, %rd1475; | |
shr.u32 %r1819, %r1818, 16; | |
shl.b32 %r1820, %r1817, 16; | |
shr.u32 %r1821, %r1817, 16; | |
shl.b32 %r1822, %r1818, 16; | |
or.b32 %r1823, %r1819, %r1820; | |
or.b32 %r1824, %r1821, %r1822; | |
mov.b64 %rd1476, {%r1824, %r1823}; | |
add.s64 %rd1477, %rd1476, %rd1469; | |
xor.b64 %rd1478, %rd1477, %rd1471; | |
mov.b64 {%r1825, %r1826}, %rd1478; | |
shr.u32 %r1827, %r1825, 31; | |
shl.b32 %r1828, %r1826, 1; | |
shr.u32 %r1829, %r1826, 31; | |
shl.b32 %r1830, %r1825, 1; | |
or.b32 %r1831, %r1827, %r1828; | |
or.b32 %r1832, %r1829, %r1830; | |
mov.b64 %rd1479, {%r1832, %r1831}; | |
ld.local.u64 %rd1480, [%rd127]; | |
add.s64 %rd1481, %rd1426, %rd1480; | |
add.s64 %rd1482, %rd1481, %rd1447; | |
xor.b64 %rd1483, %rd1482, %rd1412; | |
mov.b64 {%r1833, %r1834}, %rd1483; | |
mov.b64 %rd1484, {%r1834, %r1833}; | |
add.s64 %rd1485, %rd1484, %rd1397; | |
xor.b64 %rd1486, %rd1485, %rd1447; | |
mov.b64 {%r1835, %r1836}, %rd1486; | |
shr.u32 %r1837, %r1836, 24; | |
shl.b32 %r1838, %r1835, 8; | |
shr.u32 %r1839, %r1835, 24; | |
shl.b32 %r1840, %r1836, 8; | |
or.b32 %r1841, %r1837, %r1838; | |
or.b32 %r1842, %r1839, %r1840; | |
mov.b64 %rd1487, {%r1842, %r1841}; | |
ld.local.u64 %rd1488, [%rd128]; | |
add.s64 %rd1489, %rd1482, %rd1488; | |
add.s64 %rd1490, %rd1489, %rd1487; | |
xor.b64 %rd1491, %rd1490, %rd1484; | |
mov.b64 {%r1843, %r1844}, %rd1491; | |
shr.u32 %r1845, %r1844, 16; | |
shl.b32 %r1846, %r1843, 16; | |
shr.u32 %r1847, %r1843, 16; | |
shl.b32 %r1848, %r1844, 16; | |
or.b32 %r1849, %r1845, %r1846; | |
or.b32 %r1850, %r1847, %r1848; | |
mov.b64 %rd1492, {%r1850, %r1849}; | |
add.s64 %rd1493, %rd1492, %rd1485; | |
xor.b64 %rd1494, %rd1493, %rd1487; | |
mov.b64 {%r1851, %r1852}, %rd1494; | |
shr.u32 %r1853, %r1851, 31; | |
shl.b32 %r1854, %r1852, 1; | |
shr.u32 %r1855, %r1852, 31; | |
shl.b32 %r1856, %r1851, 1; | |
or.b32 %r1857, %r1853, %r1854; | |
or.b32 %r1858, %r1855, %r1856; | |
mov.b64 %rd1495, {%r1858, %r1857}; | |
ld.local.u64 %rd1496, [%rd129]; | |
add.s64 %rd1497, %rd1442, %rd1496; | |
add.s64 %rd1498, %rd1497, %rd1399; | |
xor.b64 %rd1499, %rd1498, %rd1428; | |
mov.b64 {%r1859, %r1860}, %rd1499; | |
mov.b64 %rd1500, {%r1860, %r1859}; | |
add.s64 %rd1501, %rd1500, %rd1413; | |
xor.b64 %rd1502, %rd1501, %rd1399; | |
mov.b64 {%r1861, %r1862}, %rd1502; | |
shr.u32 %r1863, %r1862, 24; | |
shl.b32 %r1864, %r1861, 8; | |
shr.u32 %r1865, %r1861, 24; | |
shl.b32 %r1866, %r1862, 8; | |
or.b32 %r1867, %r1863, %r1864; | |
or.b32 %r1868, %r1865, %r1866; | |
mov.b64 %rd1503, {%r1868, %r1867}; | |
ld.local.u64 %rd1504, [%rd130]; | |
add.s64 %rd1505, %rd1498, %rd1504; | |
add.s64 %rd1506, %rd1505, %rd1503; | |
xor.b64 %rd1507, %rd1506, %rd1500; | |
mov.b64 {%r1869, %r1870}, %rd1507; | |
shr.u32 %r1871, %r1870, 16; | |
shl.b32 %r1872, %r1869, 16; | |
shr.u32 %r1873, %r1869, 16; | |
shl.b32 %r1874, %r1870, 16; | |
or.b32 %r1875, %r1871, %r1872; | |
or.b32 %r1876, %r1873, %r1874; | |
mov.b64 %rd1508, {%r1876, %r1875}; | |
add.s64 %rd1509, %rd1508, %rd1501; | |
xor.b64 %rd1510, %rd1509, %rd1503; | |
mov.b64 {%r1877, %r1878}, %rd1510; | |
shr.u32 %r1879, %r1877, 31; | |
shl.b32 %r1880, %r1878, 1; | |
shr.u32 %r1881, %r1878, 31; | |
shl.b32 %r1882, %r1877, 1; | |
or.b32 %r1883, %r1879, %r1880; | |
or.b32 %r1884, %r1881, %r1882; | |
mov.b64 %rd1511, {%r1884, %r1883}; | |
ld.local.u64 %rd1512, [%rd131]; | |
add.s64 %rd1513, %rd1458, %rd1512; | |
add.s64 %rd1514, %rd1513, %rd1511; | |
xor.b64 %rd1515, %rd1514, %rd1476; | |
mov.b64 {%r1885, %r1886}, %rd1515; | |
mov.b64 %rd1516, {%r1886, %r1885}; | |
add.s64 %rd1517, %rd1516, %rd1493; | |
xor.b64 %rd1518, %rd1517, %rd1511; | |
mov.b64 {%r1887, %r1888}, %rd1518; | |
shr.u32 %r1889, %r1888, 24; | |
shl.b32 %r1890, %r1887, 8; | |
shr.u32 %r1891, %r1887, 24; | |
shl.b32 %r1892, %r1888, 8; | |
or.b32 %r1893, %r1889, %r1890; | |
or.b32 %r1894, %r1891, %r1892; | |
mov.b64 %rd1519, {%r1894, %r1893}; | |
ld.local.u64 %rd1520, [%rd132]; | |
add.s64 %rd1521, %rd1514, %rd1520; | |
add.s64 %rd1522, %rd1521, %rd1519; | |
xor.b64 %rd1523, %rd1522, %rd1516; | |
mov.b64 {%r1895, %r1896}, %rd1523; | |
shr.u32 %r1897, %r1896, 16; | |
shl.b32 %r1898, %r1895, 16; | |
shr.u32 %r1899, %r1895, 16; | |
shl.b32 %r1900, %r1896, 16; | |
or.b32 %r1901, %r1897, %r1898; | |
or.b32 %r1902, %r1899, %r1900; | |
mov.b64 %rd1524, {%r1902, %r1901}; | |
add.s64 %rd1525, %rd1524, %rd1517; | |
xor.b64 %rd1526, %rd1525, %rd1519; | |
mov.b64 {%r1903, %r1904}, %rd1526; | |
shr.u32 %r1905, %r1903, 31; | |
shl.b32 %r1906, %r1904, 1; | |
shr.u32 %r1907, %r1904, 31; | |
shl.b32 %r1908, %r1903, 1; | |
or.b32 %r1909, %r1905, %r1906; | |
or.b32 %r1910, %r1907, %r1908; | |
mov.b64 %rd1527, {%r1910, %r1909}; | |
ld.local.u64 %rd1528, [%rd133]; | |
add.s64 %rd1529, %rd1474, %rd1528; | |
add.s64 %rd1530, %rd1529, %rd1463; | |
xor.b64 %rd1531, %rd1530, %rd1492; | |
mov.b64 {%r1911, %r1912}, %rd1531; | |
mov.b64 %rd1532, {%r1912, %r1911}; | |
add.s64 %rd1533, %rd1532, %rd1509; | |
xor.b64 %rd1534, %rd1533, %rd1463; | |
mov.b64 {%r1913, %r1914}, %rd1534; | |
shr.u32 %r1915, %r1914, 24; | |
shl.b32 %r1916, %r1913, 8; | |
shr.u32 %r1917, %r1913, 24; | |
shl.b32 %r1918, %r1914, 8; | |
or.b32 %r1919, %r1915, %r1916; | |
or.b32 %r1920, %r1917, %r1918; | |
mov.b64 %rd1535, {%r1920, %r1919}; | |
ld.local.u64 %rd1536, [%rd134]; | |
add.s64 %rd1537, %rd1530, %rd1536; | |
add.s64 %rd1538, %rd1537, %rd1535; | |
xor.b64 %rd1539, %rd1538, %rd1532; | |
mov.b64 {%r1921, %r1922}, %rd1539; | |
shr.u32 %r1923, %r1922, 16; | |
shl.b32 %r1924, %r1921, 16; | |
shr.u32 %r1925, %r1921, 16; | |
shl.b32 %r1926, %r1922, 16; | |
or.b32 %r1927, %r1923, %r1924; | |
or.b32 %r1928, %r1925, %r1926; | |
mov.b64 %rd1540, {%r1928, %r1927}; | |
add.s64 %rd1541, %rd1540, %rd1533; | |
xor.b64 %rd1542, %rd1541, %rd1535; | |
mov.b64 {%r1929, %r1930}, %rd1542; | |
shr.u32 %r1931, %r1929, 31; | |
shl.b32 %r1932, %r1930, 1; | |
shr.u32 %r1933, %r1930, 31; | |
shl.b32 %r1934, %r1929, 1; | |
or.b32 %r1935, %r1931, %r1932; | |
or.b32 %r1936, %r1933, %r1934; | |
mov.b64 %rd1543, {%r1936, %r1935}; | |
ld.local.u64 %rd1544, [%rd135]; | |
add.s64 %rd1545, %rd1490, %rd1544; | |
add.s64 %rd1546, %rd1545, %rd1479; | |
xor.b64 %rd1547, %rd1546, %rd1508; | |
mov.b64 {%r1937, %r1938}, %rd1547; | |
mov.b64 %rd1548, {%r1938, %r1937}; | |
add.s64 %rd1549, %rd1548, %rd1461; | |
xor.b64 %rd1550, %rd1549, %rd1479; | |
mov.b64 {%r1939, %r1940}, %rd1550; | |
shr.u32 %r1941, %r1940, 24; | |
shl.b32 %r1942, %r1939, 8; | |
shr.u32 %r1943, %r1939, 24; | |
shl.b32 %r1944, %r1940, 8; | |
or.b32 %r1945, %r1941, %r1942; | |
or.b32 %r1946, %r1943, %r1944; | |
mov.b64 %rd1551, {%r1946, %r1945}; | |
ld.local.u64 %rd1552, [%rd136]; | |
add.s64 %rd1553, %rd1546, %rd1552; | |
add.s64 %rd1554, %rd1553, %rd1551; | |
xor.b64 %rd1555, %rd1554, %rd1548; | |
mov.b64 {%r1947, %r1948}, %rd1555; | |
shr.u32 %r1949, %r1948, 16; | |
shl.b32 %r1950, %r1947, 16; | |
shr.u32 %r1951, %r1947, 16; | |
shl.b32 %r1952, %r1948, 16; | |
or.b32 %r1953, %r1949, %r1950; | |
or.b32 %r1954, %r1951, %r1952; | |
mov.b64 %rd1556, {%r1954, %r1953}; | |
add.s64 %rd1557, %rd1556, %rd1549; | |
xor.b64 %rd1558, %rd1557, %rd1551; | |
mov.b64 {%r1955, %r1956}, %rd1558; | |
shr.u32 %r1957, %r1955, 31; | |
shl.b32 %r1958, %r1956, 1; | |
shr.u32 %r1959, %r1956, 31; | |
shl.b32 %r1960, %r1955, 1; | |
or.b32 %r1961, %r1957, %r1958; | |
or.b32 %r1962, %r1959, %r1960; | |
mov.b64 %rd1559, {%r1962, %r1961}; | |
ld.local.u64 %rd1560, [%rd137]; | |
add.s64 %rd1561, %rd1506, %rd1560; | |
add.s64 %rd1562, %rd1561, %rd1495; | |
xor.b64 %rd1563, %rd1562, %rd1460; | |
mov.b64 {%r1963, %r1964}, %rd1563; | |
mov.b64 %rd1564, {%r1964, %r1963}; | |
add.s64 %rd1565, %rd1564, %rd1477; | |
xor.b64 %rd1566, %rd1565, %rd1495; | |
mov.b64 {%r1965, %r1966}, %rd1566; | |
shr.u32 %r1967, %r1966, 24; | |
shl.b32 %r1968, %r1965, 8; | |
shr.u32 %r1969, %r1965, 24; | |
shl.b32 %r1970, %r1966, 8; | |
or.b32 %r1971, %r1967, %r1968; | |
or.b32 %r1972, %r1969, %r1970; | |
mov.b64 %rd1567, {%r1972, %r1971}; | |
ld.local.u64 %rd1568, [%rd138]; | |
add.s64 %rd1569, %rd1562, %rd1568; | |
add.s64 %rd1570, %rd1569, %rd1567; | |
xor.b64 %rd1571, %rd1570, %rd1564; | |
mov.b64 {%r1973, %r1974}, %rd1571; | |
shr.u32 %r1975, %r1974, 16; | |
shl.b32 %r1976, %r1973, 16; | |
shr.u32 %r1977, %r1973, 16; | |
shl.b32 %r1978, %r1974, 16; | |
or.b32 %r1979, %r1975, %r1976; | |
or.b32 %r1980, %r1977, %r1978; | |
mov.b64 %rd1572, {%r1980, %r1979}; | |
add.s64 %rd1573, %rd1572, %rd1565; | |
xor.b64 %rd1574, %rd1573, %rd1567; | |
mov.b64 {%r1981, %r1982}, %rd1574; | |
shr.u32 %r1983, %r1981, 31; | |
shl.b32 %r1984, %r1982, 1; | |
shr.u32 %r1985, %r1982, 31; | |
shl.b32 %r1986, %r1981, 1; | |
or.b32 %r1987, %r1983, %r1984; | |
or.b32 %r1988, %r1985, %r1986; | |
mov.b64 %rd1575, {%r1988, %r1987}; | |
ld.local.u64 %rd1576, [%rd139]; | |
add.s64 %rd1577, %rd1522, %rd1576; | |
add.s64 %rd1578, %rd1577, %rd1543; | |
xor.b64 %rd1579, %rd1578, %rd1572; | |
mov.b64 {%r1989, %r1990}, %rd1579; | |
mov.b64 %rd1580, {%r1990, %r1989}; | |
add.s64 %rd1581, %rd1580, %rd1557; | |
xor.b64 %rd1582, %rd1581, %rd1543; | |
mov.b64 {%r1991, %r1992}, %rd1582; | |
shr.u32 %r1993, %r1992, 24; | |
shl.b32 %r1994, %r1991, 8; | |
shr.u32 %r1995, %r1991, 24; | |
shl.b32 %r1996, %r1992, 8; | |
or.b32 %r1997, %r1993, %r1994; | |
or.b32 %r1998, %r1995, %r1996; | |
mov.b64 %rd1583, {%r1998, %r1997}; | |
ld.local.u64 %rd1584, [%rd140]; | |
add.s64 %rd1585, %rd1578, %rd1584; | |
add.s64 %rd1586, %rd1585, %rd1583; | |
xor.b64 %rd1587, %rd1586, %rd1580; | |
mov.b64 {%r1999, %r2000}, %rd1587; | |
shr.u32 %r2001, %r2000, 16; | |
shl.b32 %r2002, %r1999, 16; | |
shr.u32 %r2003, %r1999, 16; | |
shl.b32 %r2004, %r2000, 16; | |
or.b32 %r2005, %r2001, %r2002; | |
or.b32 %r2006, %r2003, %r2004; | |
mov.b64 %rd1588, {%r2006, %r2005}; | |
add.s64 %rd1589, %rd1588, %rd1581; | |
xor.b64 %rd1590, %rd1589, %rd1583; | |
mov.b64 {%r2007, %r2008}, %rd1590; | |
shr.u32 %r2009, %r2007, 31; | |
shl.b32 %r2010, %r2008, 1; | |
shr.u32 %r2011, %r2008, 31; | |
shl.b32 %r2012, %r2007, 1; | |
or.b32 %r2013, %r2009, %r2010; | |
or.b32 %r2014, %r2011, %r2012; | |
mov.b64 %rd1591, {%r2014, %r2013}; | |
ld.local.u64 %rd1592, [%rd141]; | |
add.s64 %rd1593, %rd1538, %rd1592; | |
add.s64 %rd1594, %rd1593, %rd1559; | |
xor.b64 %rd1595, %rd1594, %rd1524; | |
mov.b64 {%r2015, %r2016}, %rd1595; | |
mov.b64 %rd1596, {%r2016, %r2015}; | |
add.s64 %rd1597, %rd1596, %rd1573; | |
xor.b64 %rd1598, %rd1597, %rd1559; | |
mov.b64 {%r2017, %r2018}, %rd1598; | |
shr.u32 %r2019, %r2018, 24; | |
shl.b32 %r2020, %r2017, 8; | |
shr.u32 %r2021, %r2017, 24; | |
shl.b32 %r2022, %r2018, 8; | |
or.b32 %r2023, %r2019, %r2020; | |
or.b32 %r2024, %r2021, %r2022; | |
mov.b64 %rd1599, {%r2024, %r2023}; | |
ld.local.u64 %rd1600, [%rd142]; | |
add.s64 %rd1601, %rd1594, %rd1600; | |
add.s64 %rd1602, %rd1601, %rd1599; | |
xor.b64 %rd1603, %rd1602, %rd1596; | |
mov.b64 {%r2025, %r2026}, %rd1603; | |
shr.u32 %r2027, %r2026, 16; | |
shl.b32 %r2028, %r2025, 16; | |
shr.u32 %r2029, %r2025, 16; | |
shl.b32 %r2030, %r2026, 16; | |
or.b32 %r2031, %r2027, %r2028; | |
or.b32 %r2032, %r2029, %r2030; | |
mov.b64 %rd1604, {%r2032, %r2031}; | |
add.s64 %rd1605, %rd1604, %rd1597; | |
xor.b64 %rd1606, %rd1605, %rd1599; | |
mov.b64 {%r2033, %r2034}, %rd1606; | |
shr.u32 %r2035, %r2033, 31; | |
shl.b32 %r2036, %r2034, 1; | |
shr.u32 %r2037, %r2034, 31; | |
shl.b32 %r2038, %r2033, 1; | |
or.b32 %r2039, %r2035, %r2036; | |
or.b32 %r2040, %r2037, %r2038; | |
mov.b64 %rd1607, {%r2040, %r2039}; | |
ld.local.u64 %rd1608, [%rd143]; | |
add.s64 %rd1609, %rd1554, %rd1608; | |
add.s64 %rd1610, %rd1609, %rd1575; | |
xor.b64 %rd1611, %rd1610, %rd1540; | |
mov.b64 {%r2041, %r2042}, %rd1611; | |
mov.b64 %rd1612, {%r2042, %r2041}; | |
add.s64 %rd1613, %rd1612, %rd1525; | |
xor.b64 %rd1614, %rd1613, %rd1575; | |
mov.b64 {%r2043, %r2044}, %rd1614; | |
shr.u32 %r2045, %r2044, 24; | |
shl.b32 %r2046, %r2043, 8; | |
shr.u32 %r2047, %r2043, 24; | |
shl.b32 %r2048, %r2044, 8; | |
or.b32 %r2049, %r2045, %r2046; | |
or.b32 %r2050, %r2047, %r2048; | |
mov.b64 %rd1615, {%r2050, %r2049}; | |
ld.local.u64 %rd1616, [%rd144]; | |
add.s64 %rd1617, %rd1610, %rd1616; | |
add.s64 %rd1618, %rd1617, %rd1615; | |
xor.b64 %rd1619, %rd1618, %rd1612; | |
mov.b64 {%r2051, %r2052}, %rd1619; | |
shr.u32 %r2053, %r2052, 16; | |
shl.b32 %r2054, %r2051, 16; | |
shr.u32 %r2055, %r2051, 16; | |
shl.b32 %r2056, %r2052, 16; | |
or.b32 %r2057, %r2053, %r2054; | |
or.b32 %r2058, %r2055, %r2056; | |
mov.b64 %rd1620, {%r2058, %r2057}; | |
add.s64 %rd1621, %rd1620, %rd1613; | |
xor.b64 %rd1622, %rd1621, %rd1615; | |
mov.b64 {%r2059, %r2060}, %rd1622; | |
shr.u32 %r2061, %r2059, 31; | |
shl.b32 %r2062, %r2060, 1; | |
shr.u32 %r2063, %r2060, 31; | |
shl.b32 %r2064, %r2059, 1; | |
or.b32 %r2065, %r2061, %r2062; | |
or.b32 %r2066, %r2063, %r2064; | |
mov.b64 %rd1623, {%r2066, %r2065}; | |
ld.local.u64 %rd1624, [%rd145]; | |
add.s64 %rd1625, %rd1570, %rd1624; | |
add.s64 %rd1626, %rd1625, %rd1527; | |
xor.b64 %rd1627, %rd1626, %rd1556; | |
mov.b64 {%r2067, %r2068}, %rd1627; | |
mov.b64 %rd1628, {%r2068, %r2067}; | |
add.s64 %rd1629, %rd1628, %rd1541; | |
xor.b64 %rd1630, %rd1629, %rd1527; | |
mov.b64 {%r2069, %r2070}, %rd1630; | |
shr.u32 %r2071, %r2070, 24; | |
shl.b32 %r2072, %r2069, 8; | |
shr.u32 %r2073, %r2069, 24; | |
shl.b32 %r2074, %r2070, 8; | |
or.b32 %r2075, %r2071, %r2072; | |
or.b32 %r2076, %r2073, %r2074; | |
mov.b64 %rd1631, {%r2076, %r2075}; | |
ld.local.u64 %rd1632, [%rd146]; | |
add.s64 %rd1633, %rd1626, %rd1632; | |
add.s64 %rd1634, %rd1633, %rd1631; | |
xor.b64 %rd1635, %rd1634, %rd1628; | |
mov.b64 {%r2077, %r2078}, %rd1635; | |
shr.u32 %r2079, %r2078, 16; | |
shl.b32 %r2080, %r2077, 16; | |
shr.u32 %r2081, %r2077, 16; | |
shl.b32 %r2082, %r2078, 16; | |
or.b32 %r2083, %r2079, %r2080; | |
or.b32 %r2084, %r2081, %r2082; | |
mov.b64 %rd1636, {%r2084, %r2083}; | |
add.s64 %rd1637, %rd1636, %rd1629; | |
xor.b64 %rd1638, %rd1637, %rd1631; | |
mov.b64 {%r2085, %r2086}, %rd1638; | |
shr.u32 %r2087, %r2085, 31; | |
shl.b32 %r2088, %r2086, 1; | |
shr.u32 %r2089, %r2086, 31; | |
shl.b32 %r2090, %r2085, 1; | |
or.b32 %r2091, %r2087, %r2088; | |
or.b32 %r2092, %r2089, %r2090; | |
mov.b64 %rd1639, {%r2092, %r2091}; | |
ld.local.u64 %rd1640, [%rd147]; | |
add.s64 %rd1641, %rd1586, %rd1640; | |
add.s64 %rd1642, %rd1641, %rd1639; | |
xor.b64 %rd1643, %rd1642, %rd1604; | |
mov.b64 {%r2093, %r2094}, %rd1643; | |
mov.b64 %rd1644, {%r2094, %r2093}; | |
add.s64 %rd1645, %rd1644, %rd1621; | |
xor.b64 %rd1646, %rd1645, %rd1639; | |
mov.b64 {%r2095, %r2096}, %rd1646; | |
shr.u32 %r2097, %r2096, 24; | |
shl.b32 %r2098, %r2095, 8; | |
shr.u32 %r2099, %r2095, 24; | |
shl.b32 %r2100, %r2096, 8; | |
or.b32 %r2101, %r2097, %r2098; | |
or.b32 %r2102, %r2099, %r2100; | |
mov.b64 %rd1647, {%r2102, %r2101}; | |
ld.local.u64 %rd1648, [%rd148]; | |
add.s64 %rd1649, %rd1642, %rd1648; | |
add.s64 %rd1650, %rd1649, %rd1647; | |
xor.b64 %rd1651, %rd1650, %rd1644; | |
mov.b64 {%r2103, %r2104}, %rd1651; | |
shr.u32 %r2105, %r2104, 16; | |
shl.b32 %r2106, %r2103, 16; | |
shr.u32 %r2107, %r2103, 16; | |
shl.b32 %r2108, %r2104, 16; | |
or.b32 %r2109, %r2105, %r2106; | |
or.b32 %r2110, %r2107, %r2108; | |
mov.b64 %rd1652, {%r2110, %r2109}; | |
add.s64 %rd1653, %rd1652, %rd1645; | |
xor.b64 %rd1654, %rd1653, %rd1647; | |
mov.b64 {%r2111, %r2112}, %rd1654; | |
shr.u32 %r2113, %r2111, 31; | |
shl.b32 %r2114, %r2112, 1; | |
shr.u32 %r2115, %r2112, 31; | |
shl.b32 %r2116, %r2111, 1; | |
or.b32 %r2117, %r2113, %r2114; | |
or.b32 %r2118, %r2115, %r2116; | |
mov.b64 %rd1655, {%r2118, %r2117}; | |
ld.local.u64 %rd1656, [%rd149]; | |
add.s64 %rd1657, %rd1602, %rd1656; | |
add.s64 %rd1658, %rd1657, %rd1591; | |
xor.b64 %rd1659, %rd1658, %rd1620; | |
mov.b64 {%r2119, %r2120}, %rd1659; | |
mov.b64 %rd1660, {%r2120, %r2119}; | |
add.s64 %rd1661, %rd1660, %rd1637; | |
xor.b64 %rd1662, %rd1661, %rd1591; | |
mov.b64 {%r2121, %r2122}, %rd1662; | |
shr.u32 %r2123, %r2122, 24; | |
shl.b32 %r2124, %r2121, 8; | |
shr.u32 %r2125, %r2121, 24; | |
shl.b32 %r2126, %r2122, 8; | |
or.b32 %r2127, %r2123, %r2124; | |
or.b32 %r2128, %r2125, %r2126; | |
mov.b64 %rd1663, {%r2128, %r2127}; | |
ld.local.u64 %rd1664, [%rd150]; | |
add.s64 %rd1665, %rd1658, %rd1664; | |
add.s64 %rd1666, %rd1665, %rd1663; | |
xor.b64 %rd1667, %rd1666, %rd1660; | |
mov.b64 {%r2129, %r2130}, %rd1667; | |
shr.u32 %r2131, %r2130, 16; | |
shl.b32 %r2132, %r2129, 16; | |
shr.u32 %r2133, %r2129, 16; | |
shl.b32 %r2134, %r2130, 16; | |
or.b32 %r2135, %r2131, %r2132; | |
or.b32 %r2136, %r2133, %r2134; | |
mov.b64 %rd1668, {%r2136, %r2135}; | |
add.s64 %rd1669, %rd1668, %rd1661; | |
xor.b64 %rd1670, %rd1669, %rd1663; | |
mov.b64 {%r2137, %r2138}, %rd1670; | |
shr.u32 %r2139, %r2137, 31; | |
shl.b32 %r2140, %r2138, 1; | |
shr.u32 %r2141, %r2138, 31; | |
shl.b32 %r2142, %r2137, 1; | |
or.b32 %r2143, %r2139, %r2140; | |
or.b32 %r2144, %r2141, %r2142; | |
mov.b64 %rd1671, {%r2144, %r2143}; | |
ld.local.u64 %rd1672, [%rd151]; | |
add.s64 %rd1673, %rd1618, %rd1672; | |
add.s64 %rd1674, %rd1673, %rd1607; | |
xor.b64 %rd1675, %rd1674, %rd1636; | |
mov.b64 {%r2145, %r2146}, %rd1675; | |
mov.b64 %rd1676, {%r2146, %r2145}; | |
add.s64 %rd1677, %rd1676, %rd1589; | |
xor.b64 %rd1678, %rd1677, %rd1607; | |
mov.b64 {%r2147, %r2148}, %rd1678; | |
shr.u32 %r2149, %r2148, 24; | |
shl.b32 %r2150, %r2147, 8; | |
shr.u32 %r2151, %r2147, 24; | |
shl.b32 %r2152, %r2148, 8; | |
or.b32 %r2153, %r2149, %r2150; | |
or.b32 %r2154, %r2151, %r2152; | |
mov.b64 %rd1679, {%r2154, %r2153}; | |
ld.local.u64 %rd1680, [%rd152]; | |
add.s64 %rd1681, %rd1674, %rd1680; | |
add.s64 %rd1682, %rd1681, %rd1679; | |
xor.b64 %rd1683, %rd1682, %rd1676; | |
mov.b64 {%r2155, %r2156}, %rd1683; | |
shr.u32 %r2157, %r2156, 16; | |
shl.b32 %r2158, %r2155, 16; | |
shr.u32 %r2159, %r2155, 16; | |
shl.b32 %r2160, %r2156, 16; | |
or.b32 %r2161, %r2157, %r2158; | |
or.b32 %r2162, %r2159, %r2160; | |
mov.b64 %rd1684, {%r2162, %r2161}; | |
add.s64 %rd1685, %rd1684, %rd1677; | |
xor.b64 %rd1686, %rd1685, %rd1679; | |
mov.b64 {%r2163, %r2164}, %rd1686; | |
shr.u32 %r2165, %r2163, 31; | |
shl.b32 %r2166, %r2164, 1; | |
shr.u32 %r2167, %r2164, 31; | |
shl.b32 %r2168, %r2163, 1; | |
or.b32 %r2169, %r2165, %r2166; | |
or.b32 %r2170, %r2167, %r2168; | |
mov.b64 %rd1687, {%r2170, %r2169}; | |
ld.local.u64 %rd1688, [%rd153]; | |
add.s64 %rd1689, %rd1634, %rd1688; | |
add.s64 %rd1690, %rd1689, %rd1623; | |
xor.b64 %rd1691, %rd1690, %rd1588; | |
mov.b64 {%r2171, %r2172}, %rd1691; | |
mov.b64 %rd1692, {%r2172, %r2171}; | |
add.s64 %rd1693, %rd1692, %rd1605; | |
xor.b64 %rd1694, %rd1693, %rd1623; | |
mov.b64 {%r2173, %r2174}, %rd1694; | |
shr.u32 %r2175, %r2174, 24; | |
shl.b32 %r2176, %r2173, 8; | |
shr.u32 %r2177, %r2173, 24; | |
shl.b32 %r2178, %r2174, 8; | |
or.b32 %r2179, %r2175, %r2176; | |
or.b32 %r2180, %r2177, %r2178; | |
mov.b64 %rd1695, {%r2180, %r2179}; | |
ld.local.u64 %rd1696, [%rd154]; | |
add.s64 %rd1697, %rd1690, %rd1696; | |
add.s64 %rd1698, %rd1697, %rd1695; | |
xor.b64 %rd1699, %rd1698, %rd1692; | |
mov.b64 {%r2181, %r2182}, %rd1699; | |
shr.u32 %r2183, %r2182, 16; | |
shl.b32 %r2184, %r2181, 16; | |
shr.u32 %r2185, %r2181, 16; | |
shl.b32 %r2186, %r2182, 16; | |
or.b32 %r2187, %r2183, %r2184; | |
or.b32 %r2188, %r2185, %r2186; | |
mov.b64 %rd1700, {%r2188, %r2187}; | |
add.s64 %rd1701, %rd1700, %rd1693; | |
xor.b64 %rd1702, %rd1701, %rd1695; | |
mov.b64 {%r2189, %r2190}, %rd1702; | |
shr.u32 %r2191, %r2189, 31; | |
shl.b32 %r2192, %r2190, 1; | |
shr.u32 %r2193, %r2190, 31; | |
shl.b32 %r2194, %r2189, 1; | |
or.b32 %r2195, %r2191, %r2192; | |
or.b32 %r2196, %r2193, %r2194; | |
mov.b64 %rd1703, {%r2196, %r2195}; | |
ld.local.u64 %rd1704, [%rd155]; | |
add.s64 %rd1705, %rd1650, %rd1704; | |
add.s64 %rd1706, %rd1705, %rd1671; | |
xor.b64 %rd1707, %rd1706, %rd1700; | |
mov.b64 {%r2197, %r2198}, %rd1707; | |
mov.b64 %rd1708, {%r2198, %r2197}; | |
add.s64 %rd1709, %rd1708, %rd1685; | |
xor.b64 %rd1710, %rd1709, %rd1671; | |
mov.b64 {%r2199, %r2200}, %rd1710; | |
shr.u32 %r2201, %r2200, 24; | |
shl.b32 %r2202, %r2199, 8; | |
shr.u32 %r2203, %r2199, 24; | |
shl.b32 %r2204, %r2200, 8; | |
or.b32 %r2205, %r2201, %r2202; | |
or.b32 %r2206, %r2203, %r2204; | |
mov.b64 %rd1711, {%r2206, %r2205}; | |
ld.local.u64 %rd1712, [%rd156]; | |
add.s64 %rd1713, %rd1706, %rd1712; | |
add.s64 %rd1714, %rd1713, %rd1711; | |
xor.b64 %rd1715, %rd1714, %rd1708; | |
mov.b64 {%r2207, %r2208}, %rd1715; | |
shr.u32 %r2209, %r2208, 16; | |
shl.b32 %r2210, %r2207, 16; | |
shr.u32 %r2211, %r2207, 16; | |
shl.b32 %r2212, %r2208, 16; | |
or.b32 %r2213, %r2209, %r2210; | |
or.b32 %r2214, %r2211, %r2212; | |
mov.b64 %rd1716, {%r2214, %r2213}; | |
add.s64 %rd1717, %rd1716, %rd1709; | |
xor.b64 %rd1718, %rd1717, %rd1711; | |
mov.b64 {%r2215, %r2216}, %rd1718; | |
shr.u32 %r2217, %r2215, 31; | |
shl.b32 %r2218, %r2216, 1; | |
shr.u32 %r2219, %r2216, 31; | |
shl.b32 %r2220, %r2215, 1; | |
or.b32 %r2221, %r2217, %r2218; | |
or.b32 %r2222, %r2219, %r2220; | |
mov.b64 %rd1719, {%r2222, %r2221}; | |
ld.local.u64 %rd1720, [%rd157]; | |
add.s64 %rd1721, %rd1666, %rd1720; | |
add.s64 %rd1722, %rd1721, %rd1687; | |
xor.b64 %rd1723, %rd1722, %rd1652; | |
mov.b64 {%r2223, %r2224}, %rd1723; | |
mov.b64 %rd1724, {%r2224, %r2223}; | |
add.s64 %rd1725, %rd1724, %rd1701; | |
xor.b64 %rd1726, %rd1725, %rd1687; | |
mov.b64 {%r2225, %r2226}, %rd1726; | |
shr.u32 %r2227, %r2226, 24; | |
shl.b32 %r2228, %r2225, 8; | |
shr.u32 %r2229, %r2225, 24; | |
shl.b32 %r2230, %r2226, 8; | |
or.b32 %r2231, %r2227, %r2228; | |
or.b32 %r2232, %r2229, %r2230; | |
mov.b64 %rd1727, {%r2232, %r2231}; | |
ld.local.u64 %rd1728, [%rd158]; | |
add.s64 %rd1729, %rd1722, %rd1728; | |
add.s64 %rd1730, %rd1729, %rd1727; | |
xor.b64 %rd1731, %rd1730, %rd1724; | |
mov.b64 {%r2233, %r2234}, %rd1731; | |
shr.u32 %r2235, %r2234, 16; | |
shl.b32 %r2236, %r2233, 16; | |
shr.u32 %r2237, %r2233, 16; | |
shl.b32 %r2238, %r2234, 16; | |
or.b32 %r2239, %r2235, %r2236; | |
or.b32 %r2240, %r2237, %r2238; | |
mov.b64 %rd1732, {%r2240, %r2239}; | |
add.s64 %rd1733, %rd1732, %rd1725; | |
xor.b64 %rd1734, %rd1733, %rd1727; | |
mov.b64 {%r2241, %r2242}, %rd1734; | |
shr.u32 %r2243, %r2241, 31; | |
shl.b32 %r2244, %r2242, 1; | |
shr.u32 %r2245, %r2242, 31; | |
shl.b32 %r2246, %r2241, 1; | |
or.b32 %r2247, %r2243, %r2244; | |
or.b32 %r2248, %r2245, %r2246; | |
mov.b64 %rd1735, {%r2248, %r2247}; | |
ld.local.u64 %rd1736, [%rd159]; | |
add.s64 %rd1737, %rd1682, %rd1736; | |
add.s64 %rd1738, %rd1737, %rd1703; | |
xor.b64 %rd1739, %rd1738, %rd1668; | |
mov.b64 {%r2249, %r2250}, %rd1739; | |
mov.b64 %rd1740, {%r2250, %r2249}; | |
add.s64 %rd1741, %rd1740, %rd1653; | |
xor.b64 %rd1742, %rd1741, %rd1703; | |
mov.b64 {%r2251, %r2252}, %rd1742; | |
shr.u32 %r2253, %r2252, 24; | |
shl.b32 %r2254, %r2251, 8; | |
shr.u32 %r2255, %r2251, 24; | |
shl.b32 %r2256, %r2252, 8; | |
or.b32 %r2257, %r2253, %r2254; | |
or.b32 %r2258, %r2255, %r2256; | |
mov.b64 %rd1743, {%r2258, %r2257}; | |
ld.local.u64 %rd1744, [%rd160]; | |
add.s64 %rd1745, %rd1738, %rd1744; | |
add.s64 %rd1746, %rd1745, %rd1743; | |
xor.b64 %rd1747, %rd1746, %rd1740; | |
mov.b64 {%r2259, %r2260}, %rd1747; | |
shr.u32 %r2261, %r2260, 16; | |
shl.b32 %r2262, %r2259, 16; | |
shr.u32 %r2263, %r2259, 16; | |
shl.b32 %r2264, %r2260, 16; | |
or.b32 %r2265, %r2261, %r2262; | |
or.b32 %r2266, %r2263, %r2264; | |
mov.b64 %rd1748, {%r2266, %r2265}; | |
add.s64 %rd1749, %rd1748, %rd1741; | |
xor.b64 %rd1750, %rd1749, %rd1743; | |
mov.b64 {%r2267, %r2268}, %rd1750; | |
shr.u32 %r2269, %r2267, 31; | |
shl.b32 %r2270, %r2268, 1; | |
shr.u32 %r2271, %r2268, 31; | |
shl.b32 %r2272, %r2267, 1; | |
or.b32 %r2273, %r2269, %r2270; | |
or.b32 %r2274, %r2271, %r2272; | |
mov.b64 %rd1751, {%r2274, %r2273}; | |
ld.local.u64 %rd1752, [%rd161]; | |
add.s64 %rd1753, %rd1698, %rd1752; | |
add.s64 %rd1754, %rd1753, %rd1655; | |
xor.b64 %rd1755, %rd1754, %rd1684; | |
mov.b64 {%r2275, %r2276}, %rd1755; | |
mov.b64 %rd1756, {%r2276, %r2275}; | |
add.s64 %rd1757, %rd1756, %rd1669; | |
xor.b64 %rd1758, %rd1757, %rd1655; | |
mov.b64 {%r2277, %r2278}, %rd1758; | |
shr.u32 %r2279, %r2278, 24; | |
shl.b32 %r2280, %r2277, 8; | |
shr.u32 %r2281, %r2277, 24; | |
shl.b32 %r2282, %r2278, 8; | |
or.b32 %r2283, %r2279, %r2280; | |
or.b32 %r2284, %r2281, %r2282; | |
mov.b64 %rd1759, {%r2284, %r2283}; | |
ld.local.u64 %rd1760, [%rd162]; | |
add.s64 %rd1761, %rd1754, %rd1760; | |
add.s64 %rd1762, %rd1761, %rd1759; | |
xor.b64 %rd1763, %rd1762, %rd1756; | |
mov.b64 {%r2285, %r2286}, %rd1763; | |
shr.u32 %r2287, %r2286, 16; | |
shl.b32 %r2288, %r2285, 16; | |
shr.u32 %r2289, %r2285, 16; | |
shl.b32 %r2290, %r2286, 16; | |
or.b32 %r2291, %r2287, %r2288; | |
or.b32 %r2292, %r2289, %r2290; | |
mov.b64 %rd1764, {%r2292, %r2291}; | |
add.s64 %rd1765, %rd1764, %rd1757; | |
xor.b64 %rd1766, %rd1765, %rd1759; | |
mov.b64 {%r2293, %r2294}, %rd1766; | |
shr.u32 %r2295, %r2293, 31; | |
shl.b32 %r2296, %r2294, 1; | |
shr.u32 %r2297, %r2294, 31; | |
shl.b32 %r2298, %r2293, 1; | |
or.b32 %r2299, %r2295, %r2296; | |
or.b32 %r2300, %r2297, %r2298; | |
mov.b64 %rd1767, {%r2300, %r2299}; | |
ld.local.u64 %rd1768, [%rd163]; | |
add.s64 %rd1769, %rd1714, %rd1768; | |
add.s64 %rd1770, %rd1769, %rd1767; | |
xor.b64 %rd1771, %rd1770, %rd1732; | |
mov.b64 {%r2301, %r2302}, %rd1771; | |
mov.b64 %rd1772, {%r2302, %r2301}; | |
add.s64 %rd1773, %rd1772, %rd1749; | |
xor.b64 %rd1774, %rd1773, %rd1767; | |
mov.b64 {%r2303, %r2304}, %rd1774; | |
shr.u32 %r2305, %r2304, 24; | |
shl.b32 %r2306, %r2303, 8; | |
shr.u32 %r2307, %r2303, 24; | |
shl.b32 %r2308, %r2304, 8; | |
or.b32 %r2309, %r2305, %r2306; | |
or.b32 %r2310, %r2307, %r2308; | |
mov.b64 %rd1775, {%r2310, %r2309}; | |
ld.local.u64 %rd1776, [%rd164]; | |
add.s64 %rd1777, %rd1770, %rd1776; | |
add.s64 %rd1778, %rd1777, %rd1775; | |
xor.b64 %rd1779, %rd1778, %rd1772; | |
mov.b64 {%r2311, %r2312}, %rd1779; | |
shr.u32 %r2313, %r2312, 16; | |
shl.b32 %r2314, %r2311, 16; | |
shr.u32 %r2315, %r2311, 16; | |
shl.b32 %r2316, %r2312, 16; | |
or.b32 %r2317, %r2313, %r2314; | |
or.b32 %r2318, %r2315, %r2316; | |
mov.b64 %rd1780, {%r2318, %r2317}; | |
add.s64 %rd1781, %rd1780, %rd1773; | |
xor.b64 %rd1782, %rd1781, %rd1775; | |
mov.b64 {%r2319, %r2320}, %rd1782; | |
shr.u32 %r2321, %r2319, 31; | |
shl.b32 %r2322, %r2320, 1; | |
shr.u32 %r2323, %r2320, 31; | |
shl.b32 %r2324, %r2319, 1; | |
or.b32 %r2325, %r2321, %r2322; | |
or.b32 %r2326, %r2323, %r2324; | |
mov.b64 %rd1783, {%r2326, %r2325}; | |
ld.local.u64 %rd1784, [%rd165]; | |
add.s64 %rd1785, %rd1730, %rd1784; | |
add.s64 %rd1786, %rd1785, %rd1719; | |
xor.b64 %rd1787, %rd1786, %rd1748; | |
mov.b64 {%r2327, %r2328}, %rd1787; | |
mov.b64 %rd1788, {%r2328, %r2327}; | |
add.s64 %rd1789, %rd1788, %rd1765; | |
xor.b64 %rd1790, %rd1789, %rd1719; | |
mov.b64 {%r2329, %r2330}, %rd1790; | |
shr.u32 %r2331, %r2330, 24; | |
shl.b32 %r2332, %r2329, 8; | |
shr.u32 %r2333, %r2329, 24; | |
shl.b32 %r2334, %r2330, 8; | |
or.b32 %r2335, %r2331, %r2332; | |
or.b32 %r2336, %r2333, %r2334; | |
mov.b64 %rd1791, {%r2336, %r2335}; | |
ld.local.u64 %rd1792, [%rd166]; | |
add.s64 %rd1793, %rd1786, %rd1792; | |
add.s64 %rd1794, %rd1793, %rd1791; | |
xor.b64 %rd1795, %rd1794, %rd1788; | |
mov.b64 {%r2337, %r2338}, %rd1795; | |
shr.u32 %r2339, %r2338, 16; | |
shl.b32 %r2340, %r2337, 16; | |
shr.u32 %r2341, %r2337, 16; | |
shl.b32 %r2342, %r2338, 16; | |
or.b32 %r2343, %r2339, %r2340; | |
or.b32 %r2344, %r2341, %r2342; | |
mov.b64 %rd1796, {%r2344, %r2343}; | |
add.s64 %rd1797, %rd1796, %rd1789; | |
xor.b64 %rd1798, %rd1797, %rd1791; | |
mov.b64 {%r2345, %r2346}, %rd1798; | |
shr.u32 %r2347, %r2345, 31; | |
shl.b32 %r2348, %r2346, 1; | |
shr.u32 %r2349, %r2346, 31; | |
shl.b32 %r2350, %r2345, 1; | |
or.b32 %r2351, %r2347, %r2348; | |
or.b32 %r2352, %r2349, %r2350; | |
mov.b64 %rd1799, {%r2352, %r2351}; | |
ld.local.u64 %rd1800, [%rd167]; | |
add.s64 %rd1801, %rd1746, %rd1800; | |
add.s64 %rd1802, %rd1801, %rd1735; | |
xor.b64 %rd1803, %rd1802, %rd1764; | |
mov.b64 {%r2353, %r2354}, %rd1803; | |
mov.b64 %rd1804, {%r2354, %r2353}; | |
add.s64 %rd1805, %rd1804, %rd1717; | |
xor.b64 %rd1806, %rd1805, %rd1735; | |
mov.b64 {%r2355, %r2356}, %rd1806; | |
shr.u32 %r2357, %r2356, 24; | |
shl.b32 %r2358, %r2355, 8; | |
shr.u32 %r2359, %r2355, 24; | |
shl.b32 %r2360, %r2356, 8; | |
or.b32 %r2361, %r2357, %r2358; | |
or.b32 %r2362, %r2359, %r2360; | |
mov.b64 %rd1807, {%r2362, %r2361}; | |
ld.local.u64 %rd1808, [%rd168]; | |
add.s64 %rd1809, %rd1802, %rd1808; | |
add.s64 %rd1810, %rd1809, %rd1807; | |
xor.b64 %rd1811, %rd1810, %rd1804; | |
mov.b64 {%r2363, %r2364}, %rd1811; | |
shr.u32 %r2365, %r2364, 16; | |
shl.b32 %r2366, %r2363, 16; | |
shr.u32 %r2367, %r2363, 16; | |
shl.b32 %r2368, %r2364, 16; | |
or.b32 %r2369, %r2365, %r2366; | |
or.b32 %r2370, %r2367, %r2368; | |
mov.b64 %rd1812, {%r2370, %r2369}; | |
add.s64 %rd1813, %rd1812, %rd1805; | |
xor.b64 %rd1814, %rd1813, %rd1807; | |
mov.b64 {%r2371, %r2372}, %rd1814; | |
shr.u32 %r2373, %r2371, 31; | |
shl.b32 %r2374, %r2372, 1; | |
shr.u32 %r2375, %r2372, 31; | |
shl.b32 %r2376, %r2371, 1; | |
or.b32 %r2377, %r2373, %r2374; | |
or.b32 %r2378, %r2375, %r2376; | |
mov.b64 %rd1815, {%r2378, %r2377}; | |
ld.local.u64 %rd1816, [%rd169]; | |
add.s64 %rd1817, %rd1762, %rd1816; | |
add.s64 %rd1818, %rd1817, %rd1751; | |
xor.b64 %rd1819, %rd1818, %rd1716; | |
mov.b64 {%r2379, %r2380}, %rd1819; | |
mov.b64 %rd1820, {%r2380, %r2379}; | |
add.s64 %rd1821, %rd1820, %rd1733; | |
xor.b64 %rd1822, %rd1821, %rd1751; | |
mov.b64 {%r2381, %r2382}, %rd1822; | |
shr.u32 %r2383, %r2382, 24; | |
shl.b32 %r2384, %r2381, 8; | |
shr.u32 %r2385, %r2381, 24; | |
shl.b32 %r2386, %r2382, 8; | |
or.b32 %r2387, %r2383, %r2384; | |
or.b32 %r2388, %r2385, %r2386; | |
mov.b64 %rd1823, {%r2388, %r2387}; | |
ld.local.u64 %rd1824, [%rd170]; | |
add.s64 %rd1825, %rd1818, %rd1824; | |
add.s64 %rd1826, %rd1825, %rd1823; | |
xor.b64 %rd1827, %rd1826, %rd1820; | |
mov.b64 {%r2389, %r2390}, %rd1827; | |
shr.u32 %r2391, %r2390, 16; | |
shl.b32 %r2392, %r2389, 16; | |
shr.u32 %r2393, %r2389, 16; | |
shl.b32 %r2394, %r2390, 16; | |
or.b32 %r2395, %r2391, %r2392; | |
or.b32 %r2396, %r2393, %r2394; | |
mov.b64 %rd1828, {%r2396, %r2395}; | |
add.s64 %rd1829, %rd1828, %rd1821; | |
xor.b64 %rd1830, %rd1829, %rd1823; | |
mov.b64 {%r2397, %r2398}, %rd1830; | |
shr.u32 %r2399, %r2397, 31; | |
shl.b32 %r2400, %r2398, 1; | |
shr.u32 %r2401, %r2398, 31; | |
shl.b32 %r2402, %r2397, 1; | |
or.b32 %r2403, %r2399, %r2400; | |
or.b32 %r2404, %r2401, %r2402; | |
mov.b64 %rd1831, {%r2404, %r2403}; | |
ld.local.u64 %rd1832, [%rd171]; | |
add.s64 %rd1833, %rd1778, %rd1832; | |
add.s64 %rd1834, %rd1833, %rd1799; | |
xor.b64 %rd1835, %rd1834, %rd1828; | |
mov.b64 {%r2405, %r2406}, %rd1835; | |
mov.b64 %rd1836, {%r2406, %r2405}; | |
add.s64 %rd1837, %rd1836, %rd1813; | |
xor.b64 %rd1838, %rd1837, %rd1799; | |
mov.b64 {%r2407, %r2408}, %rd1838; | |
shr.u32 %r2409, %r2408, 24; | |
shl.b32 %r2410, %r2407, 8; | |
shr.u32 %r2411, %r2407, 24; | |
shl.b32 %r2412, %r2408, 8; | |
or.b32 %r2413, %r2409, %r2410; | |
or.b32 %r2414, %r2411, %r2412; | |
mov.b64 %rd1839, {%r2414, %r2413}; | |
ld.local.u64 %rd1840, [%rd172]; | |
add.s64 %rd1841, %rd1834, %rd1840; | |
add.s64 %rd1842, %rd1841, %rd1839; | |
xor.b64 %rd1843, %rd1842, %rd1836; | |
mov.b64 {%r2415, %r2416}, %rd1843; | |
shr.u32 %r2417, %r2416, 16; | |
shl.b32 %r2418, %r2415, 16; | |
shr.u32 %r2419, %r2415, 16; | |
shl.b32 %r2420, %r2416, 16; | |
or.b32 %r2421, %r2417, %r2418; | |
or.b32 %r2422, %r2419, %r2420; | |
mov.b64 %rd1844, {%r2422, %r2421}; | |
add.s64 %rd1845, %rd1844, %rd1837; | |
xor.b64 %rd1846, %rd1845, %rd1839; | |
mov.b64 {%r2423, %r2424}, %rd1846; | |
shr.u32 %r2425, %r2423, 31; | |
shl.b32 %r2426, %r2424, 1; | |
shr.u32 %r2427, %r2424, 31; | |
shl.b32 %r2428, %r2423, 1; | |
or.b32 %r2429, %r2425, %r2426; | |
or.b32 %r2430, %r2427, %r2428; | |
mov.b64 %rd1847, {%r2430, %r2429}; | |
ld.local.u64 %rd1848, [%rd173]; | |
add.s64 %rd1849, %rd1794, %rd1848; | |
add.s64 %rd1850, %rd1849, %rd1815; | |
xor.b64 %rd1851, %rd1850, %rd1780; | |
mov.b64 {%r2431, %r2432}, %rd1851; | |
mov.b64 %rd1852, {%r2432, %r2431}; | |
add.s64 %rd1853, %rd1852, %rd1829; | |
xor.b64 %rd1854, %rd1853, %rd1815; | |
mov.b64 {%r2433, %r2434}, %rd1854; | |
shr.u32 %r2435, %r2434, 24; | |
shl.b32 %r2436, %r2433, 8; | |
shr.u32 %r2437, %r2433, 24; | |
shl.b32 %r2438, %r2434, 8; | |
or.b32 %r2439, %r2435, %r2436; | |
or.b32 %r2440, %r2437, %r2438; | |
mov.b64 %rd1855, {%r2440, %r2439}; | |
ld.local.u64 %rd1856, [%rd174]; | |
add.s64 %rd1857, %rd1850, %rd1856; | |
add.s64 %rd1858, %rd1857, %rd1855; | |
xor.b64 %rd1859, %rd1858, %rd1852; | |
mov.b64 {%r2441, %r2442}, %rd1859; | |
shr.u32 %r2443, %r2442, 16; | |
shl.b32 %r2444, %r2441, 16; | |
shr.u32 %r2445, %r2441, 16; | |
shl.b32 %r2446, %r2442, 16; | |
or.b32 %r2447, %r2443, %r2444; | |
or.b32 %r2448, %r2445, %r2446; | |
mov.b64 %rd1860, {%r2448, %r2447}; | |
add.s64 %rd1861, %rd1860, %rd1853; | |
xor.b64 %rd1862, %rd1861, %rd1855; | |
mov.b64 {%r2449, %r2450}, %rd1862; | |
shr.u32 %r2451, %r2449, 31; | |
shl.b32 %r2452, %r2450, 1; | |
shr.u32 %r2453, %r2450, 31; | |
shl.b32 %r2454, %r2449, 1; | |
or.b32 %r2455, %r2451, %r2452; | |
or.b32 %r2456, %r2453, %r2454; | |
mov.b64 %rd1863, {%r2456, %r2455}; | |
ld.local.u64 %rd1864, [%rd175]; | |
add.s64 %rd1865, %rd1810, %rd1864; | |
add.s64 %rd1866, %rd1865, %rd1831; | |
xor.b64 %rd1867, %rd1866, %rd1796; | |
mov.b64 {%r2457, %r2458}, %rd1867; | |
mov.b64 %rd1868, {%r2458, %r2457}; | |
add.s64 %rd1869, %rd1868, %rd1781; | |
xor.b64 %rd1870, %rd1869, %rd1831; | |
mov.b64 {%r2459, %r2460}, %rd1870; | |
shr.u32 %r2461, %r2460, 24; | |
shl.b32 %r2462, %r2459, 8; | |
shr.u32 %r2463, %r2459, 24; | |
shl.b32 %r2464, %r2460, 8; | |
or.b32 %r2465, %r2461, %r2462; | |
or.b32 %r2466, %r2463, %r2464; | |
mov.b64 %rd1871, {%r2466, %r2465}; | |
ld.local.u64 %rd1872, [%rd176]; | |
add.s64 %rd1873, %rd1866, %rd1872; | |
add.s64 %rd1874, %rd1873, %rd1871; | |
xor.b64 %rd1875, %rd1874, %rd1868; | |
mov.b64 {%r2467, %r2468}, %rd1875; | |
shr.u32 %r2469, %r2468, 16; | |
shl.b32 %r2470, %r2467, 16; | |
shr.u32 %r2471, %r2467, 16; | |
shl.b32 %r2472, %r2468, 16; | |
or.b32 %r2473, %r2469, %r2470; | |
or.b32 %r2474, %r2471, %r2472; | |
mov.b64 %rd1876, {%r2474, %r2473}; | |
add.s64 %rd1877, %rd1876, %rd1869; | |
xor.b64 %rd1878, %rd1877, %rd1871; | |
mov.b64 {%r2475, %r2476}, %rd1878; | |
shr.u32 %r2477, %r2475, 31; | |
shl.b32 %r2478, %r2476, 1; | |
shr.u32 %r2479, %r2476, 31; | |
shl.b32 %r2480, %r2475, 1; | |
or.b32 %r2481, %r2477, %r2478; | |
or.b32 %r2482, %r2479, %r2480; | |
mov.b64 %rd1879, {%r2482, %r2481}; | |
ld.local.u64 %rd1880, [%rd177]; | |
add.s64 %rd1881, %rd1826, %rd1880; | |
add.s64 %rd1882, %rd1881, %rd1783; | |
xor.b64 %rd1883, %rd1882, %rd1812; | |
mov.b64 {%r2483, %r2484}, %rd1883; | |
mov.b64 %rd1884, {%r2484, %r2483}; | |
add.s64 %rd1885, %rd1884, %rd1797; | |
xor.b64 %rd1886, %rd1885, %rd1783; | |
mov.b64 {%r2485, %r2486}, %rd1886; | |
shr.u32 %r2487, %r2486, 24; | |
shl.b32 %r2488, %r2485, 8; | |
shr.u32 %r2489, %r2485, 24; | |
shl.b32 %r2490, %r2486, 8; | |
or.b32 %r2491, %r2487, %r2488; | |
or.b32 %r2492, %r2489, %r2490; | |
mov.b64 %rd1887, {%r2492, %r2491}; | |
ld.local.u64 %rd1888, [%rd178]; | |
add.s64 %rd1889, %rd1882, %rd1888; | |
add.s64 %rd1890, %rd1889, %rd1887; | |
xor.b64 %rd1891, %rd1890, %rd1884; | |
mov.b64 {%r2493, %r2494}, %rd1891; | |
shr.u32 %r2495, %r2494, 16; | |
shl.b32 %r2496, %r2493, 16; | |
shr.u32 %r2497, %r2493, 16; | |
shl.b32 %r2498, %r2494, 16; | |
or.b32 %r2499, %r2495, %r2496; | |
or.b32 %r2500, %r2497, %r2498; | |
mov.b64 %rd1892, {%r2500, %r2499}; | |
add.s64 %rd1893, %rd1892, %rd1885; | |
xor.b64 %rd1894, %rd1893, %rd1887; | |
mov.b64 {%r2501, %r2502}, %rd1894; | |
shr.u32 %r2503, %r2501, 31; | |
shl.b32 %r2504, %r2502, 1; | |
shr.u32 %r2505, %r2502, 31; | |
shl.b32 %r2506, %r2501, 1; | |
or.b32 %r2507, %r2503, %r2504; | |
or.b32 %r2508, %r2505, %r2506; | |
mov.b64 %rd1895, {%r2508, %r2507}; | |
ld.local.u64 %rd1896, [%rd179]; | |
add.s64 %rd1897, %rd1842, %rd1896; | |
add.s64 %rd1898, %rd1897, %rd1895; | |
xor.b64 %rd1899, %rd1898, %rd1860; | |
mov.b64 {%r2509, %r2510}, %rd1899; | |
mov.b64 %rd1900, {%r2510, %r2509}; | |
add.s64 %rd1901, %rd1900, %rd1877; | |
xor.b64 %rd1902, %rd1901, %rd1895; | |
mov.b64 {%r2511, %r2512}, %rd1902; | |
shr.u32 %r2513, %r2512, 24; | |
shl.b32 %r2514, %r2511, 8; | |
shr.u32 %r2515, %r2511, 24; | |
shl.b32 %r2516, %r2512, 8; | |
or.b32 %r2517, %r2513, %r2514; | |
or.b32 %r2518, %r2515, %r2516; | |
mov.b64 %rd1903, {%r2518, %r2517}; | |
ld.local.u64 %rd1904, [%rd180]; | |
add.s64 %rd1905, %rd1898, %rd1904; | |
add.s64 %rd1906, %rd1905, %rd1903; | |
xor.b64 %rd1907, %rd1906, %rd1900; | |
mov.b64 {%r2519, %r2520}, %rd1907; | |
shr.u32 %r2521, %r2520, 16; | |
shl.b32 %r2522, %r2519, 16; | |
shr.u32 %r2523, %r2519, 16; | |
shl.b32 %r2524, %r2520, 16; | |
or.b32 %r2525, %r2521, %r2522; | |
or.b32 %r2526, %r2523, %r2524; | |
mov.b64 %rd1908, {%r2526, %r2525}; | |
add.s64 %rd1909, %rd1908, %rd1901; | |
xor.b64 %rd1910, %rd1909, %rd1903; | |
mov.b64 {%r2527, %r2528}, %rd1910; | |
shr.u32 %r2529, %r2527, 31; | |
shl.b32 %r2530, %r2528, 1; | |
shr.u32 %r2531, %r2528, 31; | |
shl.b32 %r2532, %r2527, 1; | |
or.b32 %r2533, %r2529, %r2530; | |
or.b32 %r2534, %r2531, %r2532; | |
mov.b64 %rd1911, {%r2534, %r2533}; | |
ld.local.u64 %rd1912, [%rd181]; | |
add.s64 %rd1913, %rd1858, %rd1912; | |
add.s64 %rd1914, %rd1913, %rd1847; | |
xor.b64 %rd1915, %rd1914, %rd1876; | |
mov.b64 {%r2535, %r2536}, %rd1915; | |
mov.b64 %rd1916, {%r2536, %r2535}; | |
add.s64 %rd1917, %rd1916, %rd1893; | |
xor.b64 %rd1918, %rd1917, %rd1847; | |
mov.b64 {%r2537, %r2538}, %rd1918; | |
shr.u32 %r2539, %r2538, 24; | |
shl.b32 %r2540, %r2537, 8; | |
shr.u32 %r2541, %r2537, 24; | |
shl.b32 %r2542, %r2538, 8; | |
or.b32 %r2543, %r2539, %r2540; | |
or.b32 %r2544, %r2541, %r2542; | |
mov.b64 %rd1919, {%r2544, %r2543}; | |
ld.local.u64 %rd1920, [%rd182]; | |
add.s64 %rd1921, %rd1914, %rd1920; | |
add.s64 %rd1922, %rd1921, %rd1919; | |
xor.b64 %rd1923, %rd1922, %rd1916; | |
mov.b64 {%r2545, %r2546}, %rd1923; | |
shr.u32 %r2547, %r2546, 16; | |
shl.b32 %r2548, %r2545, 16; | |
shr.u32 %r2549, %r2545, 16; | |
shl.b32 %r2550, %r2546, 16; | |
or.b32 %r2551, %r2547, %r2548; | |
or.b32 %r2552, %r2549, %r2550; | |
mov.b64 %rd1924, {%r2552, %r2551}; | |
add.s64 %rd1925, %rd1924, %rd1917; | |
xor.b64 %rd1926, %rd1925, %rd1919; | |
mov.b64 {%r2553, %r2554}, %rd1926; | |
shr.u32 %r2555, %r2553, 31; | |
shl.b32 %r2556, %r2554, 1; | |
shr.u32 %r2557, %r2554, 31; | |
shl.b32 %r2558, %r2553, 1; | |
or.b32 %r2559, %r2555, %r2556; | |
or.b32 %r2560, %r2557, %r2558; | |
mov.b64 %rd1927, {%r2560, %r2559}; | |
ld.local.u64 %rd1928, [%rd183]; | |
add.s64 %rd1929, %rd1874, %rd1928; | |
add.s64 %rd1930, %rd1929, %rd1863; | |
xor.b64 %rd1931, %rd1930, %rd1892; | |
mov.b64 {%r2561, %r2562}, %rd1931; | |
mov.b64 %rd1932, {%r2562, %r2561}; | |
add.s64 %rd1933, %rd1932, %rd1845; | |
xor.b64 %rd1934, %rd1933, %rd1863; | |
mov.b64 {%r2563, %r2564}, %rd1934; | |
shr.u32 %r2565, %r2564, 24; | |
shl.b32 %r2566, %r2563, 8; | |
shr.u32 %r2567, %r2563, 24; | |
shl.b32 %r2568, %r2564, 8; | |
or.b32 %r2569, %r2565, %r2566; | |
or.b32 %r2570, %r2567, %r2568; | |
mov.b64 %rd1935, {%r2570, %r2569}; | |
ld.local.u64 %rd1936, [%rd184]; | |
add.s64 %rd1937, %rd1930, %rd1936; | |
add.s64 %rd1938, %rd1937, %rd1935; | |
xor.b64 %rd1939, %rd1938, %rd1932; | |
mov.b64 {%r2571, %r2572}, %rd1939; | |
shr.u32 %r2573, %r2572, 16; | |
shl.b32 %r2574, %r2571, 16; | |
shr.u32 %r2575, %r2571, 16; | |
shl.b32 %r2576, %r2572, 16; | |
or.b32 %r2577, %r2573, %r2574; | |
or.b32 %r2578, %r2575, %r2576; | |
mov.b64 %rd1940, {%r2578, %r2577}; | |
add.s64 %rd1941, %rd1940, %rd1933; | |
xor.b64 %rd1942, %rd1941, %rd1935; | |
mov.b64 {%r2579, %r2580}, %rd1942; | |
shr.u32 %r2581, %r2579, 31; | |
shl.b32 %r2582, %r2580, 1; | |
shr.u32 %r2583, %r2580, 31; | |
shl.b32 %r2584, %r2579, 1; | |
or.b32 %r2585, %r2581, %r2582; | |
or.b32 %r2586, %r2583, %r2584; | |
mov.b64 %rd1943, {%r2586, %r2585}; | |
ld.local.u64 %rd1944, [%rd185]; | |
add.s64 %rd1945, %rd1890, %rd1944; | |
add.s64 %rd1946, %rd1945, %rd1879; | |
xor.b64 %rd1947, %rd1946, %rd1844; | |
mov.b64 {%r2587, %r2588}, %rd1947; | |
mov.b64 %rd1948, {%r2588, %r2587}; | |
add.s64 %rd1949, %rd1948, %rd1861; | |
xor.b64 %rd1950, %rd1949, %rd1879; | |
mov.b64 {%r2589, %r2590}, %rd1950; | |
shr.u32 %r2591, %r2590, 24; | |
shl.b32 %r2592, %r2589, 8; | |
shr.u32 %r2593, %r2589, 24; | |
shl.b32 %r2594, %r2590, 8; | |
or.b32 %r2595, %r2591, %r2592; | |
or.b32 %r2596, %r2593, %r2594; | |
mov.b64 %rd1951, {%r2596, %r2595}; | |
ld.local.u64 %rd1952, [%rd186]; | |
add.s64 %rd1953, %rd1946, %rd1952; | |
add.s64 %rd1954, %rd1953, %rd1951; | |
xor.b64 %rd1955, %rd1954, %rd1948; | |
mov.b64 {%r2597, %r2598}, %rd1955; | |
shr.u32 %r2599, %r2598, 16; | |
shl.b32 %r2600, %r2597, 16; | |
shr.u32 %r2601, %r2597, 16; | |
shl.b32 %r2602, %r2598, 16; | |
or.b32 %r2603, %r2599, %r2600; | |
or.b32 %r2604, %r2601, %r2602; | |
mov.b64 %rd1956, {%r2604, %r2603}; | |
add.s64 %rd1957, %rd1956, %rd1949; | |
xor.b64 %rd1958, %rd1957, %rd1951; | |
mov.b64 {%r2605, %r2606}, %rd1958; | |
shr.u32 %r2607, %r2605, 31; | |
shl.b32 %r2608, %r2606, 1; | |
shr.u32 %r2609, %r2606, 31; | |
shl.b32 %r2610, %r2605, 1; | |
or.b32 %r2611, %r2607, %r2608; | |
or.b32 %r2612, %r2609, %r2610; | |
mov.b64 %rd1959, {%r2612, %r2611}; | |
ld.local.u64 %rd1960, [%rd187]; | |
add.s64 %rd1961, %rd1906, %rd1960; | |
add.s64 %rd1962, %rd1961, %rd1927; | |
xor.b64 %rd1963, %rd1962, %rd1956; | |
mov.b64 {%r2613, %r2614}, %rd1963; | |
mov.b64 %rd1964, {%r2614, %r2613}; | |
add.s64 %rd1965, %rd1964, %rd1941; | |
xor.b64 %rd1966, %rd1965, %rd1927; | |
mov.b64 {%r2615, %r2616}, %rd1966; | |
shr.u32 %r2617, %r2616, 24; | |
shl.b32 %r2618, %r2615, 8; | |
shr.u32 %r2619, %r2615, 24; | |
shl.b32 %r2620, %r2616, 8; | |
or.b32 %r2621, %r2617, %r2618; | |
or.b32 %r2622, %r2619, %r2620; | |
mov.b64 %rd1967, {%r2622, %r2621}; | |
ld.local.u64 %rd1968, [%rd188]; | |
add.s64 %rd1969, %rd1962, %rd1968; | |
add.s64 %rd1970, %rd1969, %rd1967; | |
xor.b64 %rd1971, %rd1970, %rd1964; | |
mov.b64 {%r2623, %r2624}, %rd1971; | |
shr.u32 %r2625, %r2624, 16; | |
shl.b32 %r2626, %r2623, 16; | |
shr.u32 %r2627, %r2623, 16; | |
shl.b32 %r2628, %r2624, 16; | |
or.b32 %r2629, %r2625, %r2626; | |
or.b32 %r2630, %r2627, %r2628; | |
mov.b64 %rd1972, {%r2630, %r2629}; | |
add.s64 %rd1973, %rd1972, %rd1965; | |
xor.b64 %rd1974, %rd1973, %rd1967; | |
mov.b64 {%r2631, %r2632}, %rd1974; | |
shr.u32 %r2633, %r2631, 31; | |
shl.b32 %r2634, %r2632, 1; | |
shr.u32 %r2635, %r2632, 31; | |
shl.b32 %r2636, %r2631, 1; | |
or.b32 %r2637, %r2633, %r2634; | |
or.b32 %r2638, %r2635, %r2636; | |
mov.b64 %rd1975, {%r2638, %r2637}; | |
ld.local.u64 %rd1976, [%rd189]; | |
add.s64 %rd1977, %rd1922, %rd1976; | |
add.s64 %rd1978, %rd1977, %rd1943; | |
xor.b64 %rd1979, %rd1978, %rd1908; | |
mov.b64 {%r2639, %r2640}, %rd1979; | |
mov.b64 %rd1980, {%r2640, %r2639}; | |
add.s64 %rd1981, %rd1980, %rd1957; | |
xor.b64 %rd1982, %rd1981, %rd1943; | |
mov.b64 {%r2641, %r2642}, %rd1982; | |
shr.u32 %r2643, %r2642, 24; | |
shl.b32 %r2644, %r2641, 8; | |
shr.u32 %r2645, %r2641, 24; | |
shl.b32 %r2646, %r2642, 8; | |
or.b32 %r2647, %r2643, %r2644; | |
or.b32 %r2648, %r2645, %r2646; | |
mov.b64 %rd1983, {%r2648, %r2647}; | |
ld.local.u64 %rd1984, [%rd190]; | |
add.s64 %rd1985, %rd1978, %rd1984; | |
add.s64 %rd1986, %rd1985, %rd1983; | |
xor.b64 %rd1987, %rd1986, %rd1980; | |
mov.b64 {%r2649, %r2650}, %rd1987; | |
shr.u32 %r2651, %r2650, 16; | |
shl.b32 %r2652, %r2649, 16; | |
shr.u32 %r2653, %r2649, 16; | |
shl.b32 %r2654, %r2650, 16; | |
or.b32 %r2655, %r2651, %r2652; | |
or.b32 %r2656, %r2653, %r2654; | |
mov.b64 %rd1988, {%r2656, %r2655}; | |
add.s64 %rd1989, %rd1988, %rd1981; | |
xor.b64 %rd1990, %rd1989, %rd1983; | |
mov.b64 {%r2657, %r2658}, %rd1990; | |
shr.u32 %r2659, %r2657, 31; | |
shl.b32 %r2660, %r2658, 1; | |
shr.u32 %r2661, %r2658, 31; | |
shl.b32 %r2662, %r2657, 1; | |
or.b32 %r2663, %r2659, %r2660; | |
or.b32 %r2664, %r2661, %r2662; | |
mov.b64 %rd1991, {%r2664, %r2663}; | |
ld.local.u64 %rd1992, [%rd191]; | |
add.s64 %rd1993, %rd1938, %rd1992; | |
add.s64 %rd1994, %rd1993, %rd1959; | |
xor.b64 %rd1995, %rd1994, %rd1924; | |
mov.b64 {%r2665, %r2666}, %rd1995; | |
mov.b64 %rd1996, {%r2666, %r2665}; | |
add.s64 %rd1997, %rd1996, %rd1909; | |
xor.b64 %rd1998, %rd1997, %rd1959; | |
mov.b64 {%r2667, %r2668}, %rd1998; | |
shr.u32 %r2669, %r2668, 24; | |
shl.b32 %r2670, %r2667, 8; | |
shr.u32 %r2671, %r2667, 24; | |
shl.b32 %r2672, %r2668, 8; | |
or.b32 %r2673, %r2669, %r2670; | |
or.b32 %r2674, %r2671, %r2672; | |
mov.b64 %rd1999, {%r2674, %r2673}; | |
ld.local.u64 %rd2000, [%rd192]; | |
add.s64 %rd2001, %rd1994, %rd2000; | |
add.s64 %rd2002, %rd2001, %rd1999; | |
xor.b64 %rd2003, %rd2002, %rd1996; | |
mov.b64 {%r2675, %r2676}, %rd2003; | |
shr.u32 %r2677, %r2676, 16; | |
shl.b32 %r2678, %r2675, 16; | |
shr.u32 %r2679, %r2675, 16; | |
shl.b32 %r2680, %r2676, 16; | |
or.b32 %r2681, %r2677, %r2678; | |
or.b32 %r2682, %r2679, %r2680; | |
mov.b64 %rd2004, {%r2682, %r2681}; | |
add.s64 %rd2005, %rd2004, %rd1997; | |
xor.b64 %rd2006, %rd2005, %rd1999; | |
mov.b64 {%r2683, %r2684}, %rd2006; | |
shr.u32 %r2685, %r2683, 31; | |
shl.b32 %r2686, %r2684, 1; | |
shr.u32 %r2687, %r2684, 31; | |
shl.b32 %r2688, %r2683, 1; | |
or.b32 %r2689, %r2685, %r2686; | |
or.b32 %r2690, %r2687, %r2688; | |
mov.b64 %rd2007, {%r2690, %r2689}; | |
ld.local.u64 %rd2008, [%rd193]; | |
add.s64 %rd2009, %rd1954, %rd2008; | |
add.s64 %rd2010, %rd2009, %rd1911; | |
xor.b64 %rd2011, %rd2010, %rd1940; | |
mov.b64 {%r2691, %r2692}, %rd2011; | |
mov.b64 %rd2012, {%r2692, %r2691}; | |
add.s64 %rd2013, %rd2012, %rd1925; | |
xor.b64 %rd2014, %rd2013, %rd1911; | |
mov.b64 {%r2693, %r2694}, %rd2014; | |
shr.u32 %r2695, %r2694, 24; | |
shl.b32 %r2696, %r2693, 8; | |
shr.u32 %r2697, %r2693, 24; | |
shl.b32 %r2698, %r2694, 8; | |
or.b32 %r2699, %r2695, %r2696; | |
or.b32 %r2700, %r2697, %r2698; | |
mov.b64 %rd2015, {%r2700, %r2699}; | |
ld.local.u64 %rd2016, [%rd194]; | |
add.s64 %rd2017, %rd2010, %rd2016; | |
add.s64 %rd2018, %rd2017, %rd2015; | |
xor.b64 %rd2019, %rd2018, %rd2012; | |
mov.b64 {%r2701, %r2702}, %rd2019; | |
shr.u32 %r2703, %r2702, 16; | |
shl.b32 %r2704, %r2701, 16; | |
shr.u32 %r2705, %r2701, 16; | |
shl.b32 %r2706, %r2702, 16; | |
or.b32 %r2707, %r2703, %r2704; | |
or.b32 %r2708, %r2705, %r2706; | |
mov.b64 %rd2020, {%r2708, %r2707}; | |
add.s64 %rd2021, %rd2020, %rd2013; | |
xor.b64 %rd2022, %rd2021, %rd2015; | |
mov.b64 {%r2709, %r2710}, %rd2022; | |
shr.u32 %r2711, %r2709, 31; | |
shl.b32 %r2712, %r2710, 1; | |
shr.u32 %r2713, %r2710, 31; | |
shl.b32 %r2714, %r2709, 1; | |
or.b32 %r2715, %r2711, %r2712; | |
or.b32 %r2716, %r2713, %r2714; | |
mov.b64 %rd2023, {%r2716, %r2715}; | |
xor.b64 %rd2024, %rd1970, %rd480; | |
xor.b64 %rd2025, %rd2024, %rd2005; | |
st.local.u64 [%rd1], %rd2025; | |
xor.b64 %rd2026, %rd1986, %rd499; | |
xor.b64 %rd198, %rd2026, %rd2021; | |
st.local.u64 [%rd1+8], %rd198; | |
xor.b64 %rd2027, %rd2002, %rd517; | |
xor.b64 %rd199, %rd2027, %rd1973; | |
st.local.u64 [%rd1+16], %rd199; | |
xor.b64 %rd2028, %rd2018, %rd535; | |
xor.b64 %rd200, %rd2028, %rd1989; | |
st.local.u64 [%rd1+24], %rd200; | |
xor.b64 %rd2029, %rd1988, %rd479; | |
xor.b64 %rd201, %rd2029, %rd2023; | |
st.local.u64 [%rd1+32], %rd201; | |
xor.b64 %rd2030, %rd2004, %rd498; | |
xor.b64 %rd202, %rd2030, %rd1975; | |
st.local.u64 [%rd1+40], %rd202; | |
xor.b64 %rd2031, %rd2020, %rd516; | |
xor.b64 %rd203, %rd2031, %rd1991; | |
st.local.u64 [%rd1+48], %rd203; | |
xor.b64 %rd2032, %rd1972, %rd534; | |
xor.b64 %rd2033, %rd2032, %rd2007; | |
st.local.u64 [%rd1+56], %rd2033; | |
ld.local.u8 %rs7, [%rd2056+1]; | |
ld.local.u8 %rs8, [%rd2056+2]; | |
ld.local.u8 %rs9, [%rd2056+3]; | |
ld.local.u8 %rs10, [%rd2056+4]; | |
ld.local.u8 %rs11, [%rd2056+5]; | |
ld.local.u8 %rs12, [%rd2056+6]; | |
ld.local.u8 %rs13, [%rd2056+8]; | |
ld.local.u8 %rs14, [%rd2056+9]; | |
ld.local.u8 %rs15, [%rd2056+10]; | |
ld.local.u8 %rs16, [%rd2056+11]; | |
ld.local.u8 %rs17, [%rd2056+12]; | |
ld.local.u8 %rs18, [%rd2056+13]; | |
ld.local.u8 %rs19, [%rd2056+14]; | |
ld.local.u8 %rs20, [%rd2056+16]; | |
ld.local.u8 %rs21, [%rd2056+17]; | |
ld.local.u8 %rs22, [%rd2056+18]; | |
ld.local.u8 %rs23, [%rd2056+19]; | |
ld.local.u8 %rs24, [%rd2056+20]; | |
ld.local.u8 %rs25, [%rd2056+21]; | |
ld.local.u8 %rs26, [%rd2056+22]; | |
ld.local.u8 %rs27, [%rd2056+24]; | |
ld.local.u8 %rs28, [%rd2056+25]; | |
ld.local.u8 %rs29, [%rd2056+26]; | |
ld.local.u8 %rs30, [%rd2056+27]; | |
ld.local.u8 %rs31, [%rd2056+28]; | |
ld.local.u8 %rs32, [%rd2056+29]; | |
ld.local.u8 %rs33, [%rd2056+30]; | |
ld.local.u8 %rs34, [%rd2056+32]; | |
ld.local.u8 %rs35, [%rd2056+33]; | |
ld.local.u8 %rs36, [%rd2056+34]; | |
ld.local.u8 %rs37, [%rd2056+35]; | |
ld.local.u8 %rs38, [%rd2056+36]; | |
ld.local.u8 %rs39, [%rd2056+37]; | |
ld.local.u8 %rs40, [%rd2056+38]; | |
ld.local.u8 %rs41, [%rd2056+40]; | |
ld.local.u8 %rs42, [%rd2056+41]; | |
ld.local.u8 %rs43, [%rd2056+42]; | |
ld.local.u8 %rs44, [%rd2056+43]; | |
ld.local.u8 %rs45, [%rd2056+44]; | |
ld.local.u8 %rs46, [%rd2056+45]; | |
ld.local.u8 %rs47, [%rd2056+46]; | |
ld.local.u8 %rs48, [%rd2056+48]; | |
and.b64 %rd2034, %rd2025, 255; | |
shl.b64 %rd2035, %rd2034, 8; | |
ld.local.u8 %rd2036, [%rd2056]; | |
or.b64 %rd204, %rd2035, %rd2036; | |
shl.b64 %rd2037, %rd204, 2; | |
add.s64 %rd2038, %rd209, %rd2037; | |
atom.global.add.u32 %r7, [%rd2038], 1; | |
setp.gt.u32 %p4, %r7, 63; | |
@%p4 bra BB1_7; | |
shl.b32 %r2734, %r2736, 1; | |
shr.u16 %rs59, %rs7, 4; | |
cvt.u32.u16 %r2717, %rs59; | |
bfe.u32 %r2718, %r2736, 5, 26; | |
and.b32 %r2719, %r2734, 62; | |
shl.b32 %r2720, %r2719, 16; | |
or.b32 %r2721, %r2720, %r2718; | |
shl.b32 %r2722, %r2717, 28; | |
or.b32 %r2723, %r2721, %r2722; | |
mul.lo.s64 %rd2039, %rd204, 1792; | |
add.s64 %rd2040, %rd208, %rd2039; | |
mul.wide.u32 %rd2041, %r7, 28; | |
add.s64 %rd2042, %rd2040, %rd2041; | |
st.global.u32 [%rd2042], %r2723; | |
st.global.u8 [%rd2042+5], %rs7; | |
st.global.v2.u8 [%rd2042+6], {%rs8, %rs9}; | |
cvt.u16.u64 %rs60, %rd198; | |
st.global.v4.u8 [%rd2042+8], {%rs10, %rs11, %rs12, %rs60}; | |
st.global.v4.u8 [%rd2042+12], {%rs13, %rs14, %rs15, %rs16}; | |
cvt.u16.u64 %rs61, %rd199; | |
st.global.v4.u8 [%rd2042+16], {%rs17, %rs18, %rs19, %rs61}; | |
st.global.v4.u8 [%rd2042+20], {%rs20, %rs21, %rs22, %rs23}; | |
cvt.u16.u64 %rs62, %rd200; | |
st.global.v4.u8 [%rd2042+24], {%rs24, %rs25, %rs26, %rs62}; | |
BB1_7: | |
cvt.u64.u16 %rd2043, %rs28; | |
and.b64 %rd2044, %rd2043, 255; | |
cvt.u32.u16 %r2724, %rs27; | |
and.b32 %r2725, %r2724, 255; | |
mul.wide.u32 %rd2045, %r2725, 256; | |
or.b64 %rd205, %rd2045, %rd2044; | |
shl.b64 %rd2046, %rd205, 2; | |
add.s64 %rd2047, %rd209, %rd2046; | |
atom.global.add.u32 %r8, [%rd2047], 1; | |
setp.gt.u32 %p5, %r8, 63; | |
@%p5 bra BB1_9; | |
shl.b32 %r2735, %r2736, 1; | |
shr.u16 %rs63, %rs29, 4; | |
cvt.u32.u16 %r2726, %rs63; | |
add.s32 %r2727, %r2735, 1; | |
shr.u32 %r2728, %r2727, 6; | |
and.b32 %r2729, %r2727, 63; | |
shl.b32 %r2730, %r2729, 16; | |
or.b32 %r2731, %r2730, %r2728; | |
shl.b32 %r2732, %r2726, 28; | |
or.b32 %r2733, %r2731, %r2732; | |
mul.lo.s64 %rd2048, %rd205, 1792; | |
add.s64 %rd2049, %rd208, %rd2048; | |
mul.wide.u32 %rd2050, %r8, 28; | |
add.s64 %rd2051, %rd2049, %rd2050; | |
st.global.u32 [%rd2051], %r2733; | |
st.global.u8 [%rd2051+5], %rs29; | |
st.global.v2.u8 [%rd2051+6], {%rs30, %rs31}; | |
cvt.u16.u64 %rs64, %rd201; | |
st.global.v4.u8 [%rd2051+8], {%rs32, %rs33, %rs64, %rs34}; | |
st.global.v4.u8 [%rd2051+12], {%rs35, %rs36, %rs37, %rs38}; | |
cvt.u16.u64 %rs65, %rd202; | |
st.global.v4.u8 [%rd2051+16], {%rs39, %rs40, %rs65, %rs41}; | |
st.global.v4.u8 [%rd2051+20], {%rs42, %rs43, %rs44, %rs45}; | |
cvt.u16.u64 %rs66, %rd203; | |
st.global.v4.u8 [%rd2051+24], {%rs46, %rs47, %rs66, %rs48}; | |
BB1_9: | |
and.b64 %rd2052, %rd2057, 4294967295; | |
add.s64 %rd2057, %rd195, %rd2052; | |
cvt.u32.u64 %r2736, %rd2057; | |
setp.lt.u32 %p6, %r2736, 1048576; | |
@%p6 bra BB1_2; | |
BB1_10: | |
ret; | |
} | |
// .globl digitOdd | |
.entry digitOdd( | |
.param .u32 digitOdd_param_0, | |
.param .u64 .ptr .global .align 4 digitOdd_param_1, | |
.param .u64 .ptr .global .align 4 digitOdd_param_2, | |
.param .u64 .ptr .global .align 4 digitOdd_param_3 | |
) | |
{ | |
.local .align 8 .b8 __local_depot2[296]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<13>; | |
.reg .b16 %rs<14>; | |
.reg .b32 %r<95>; | |
.reg .b64 %rd<110>; | |
mov.u64 %rd109, __local_depot2; | |
cvta.local.u64 %SP, %rd109; | |
ld.param.u32 %r21, [digitOdd_param_0]; | |
ld.param.u64 %rd35, [digitOdd_param_1]; | |
ld.param.u64 %rd36, [digitOdd_param_2]; | |
ld.param.u64 %rd37, [digitOdd_param_3]; | |
add.u64 %rd38, %SP, 0; | |
cvta.to.local.u64 %rd1, %rd38; | |
setp.eq.s32 %p1, %r21, 0; | |
mov.u32 %r88, 0; | |
mov.u32 %r94, %r88; | |
mov.u32 %r87, %r88; | |
@%p1 bra BB2_2; | |
mul.lo.s32 %r25, %r21, -20; | |
add.s32 %r26, %r25, 187; | |
shr.u32 %r27, %r26, 3; | |
add.s32 %r28, %r27, 3; | |
shr.u32 %r29, %r28, 2; | |
add.s32 %r30, %r25, 207; | |
shr.u32 %r31, %r30, 3; | |
add.s32 %r32, %r31, 3; | |
shr.u32 %r87, %r32, 2; | |
shl.b32 %r33, %r87, 2; | |
sub.s32 %r88, %r33, %r31; | |
sub.s32 %r94, %r87, %r29; | |
BB2_2: | |
mov.u32 %r5, %r94; | |
mov.u32 %r34, %ctaid.x; | |
mov.u32 %r7, %ntid.x; | |
mov.b32 %r35, %envreg3; | |
mad.lo.s32 %r36, %r34, %r7, %r35; | |
mov.u32 %r37, %tid.x; | |
add.s32 %r89, %r36, %r37; | |
setp.gt.u32 %p2, %r89, 65535; | |
@%p2 bra BB2_17; | |
cvt.s64.s32 %rd105, %r89; | |
not.b32 %r38, %r21; | |
add.s32 %r39, %r21, -1; | |
shr.u32 %r40, %r39, 1; | |
cvt.u64.u32 %rd39, %r40; | |
mul.wide.u32 %rd40, %r40, 4; | |
add.s64 %rd3, %rd35, %rd40; | |
and.b32 %r41, %r38, 1; | |
cvt.u64.u32 %rd4, %r41; | |
mov.b32 %r42, %envreg6; | |
mul.lo.s32 %r43, %r7, %r42; | |
cvt.s64.s32 %rd5, %r43; | |
add.s32 %r44, %r87, -1; | |
cvt.u64.u32 %rd6, %r44; | |
cvt.u64.u32 %rd7, %r88; | |
add.s32 %r45, %r88, 1; | |
cvt.u64.u32 %rd8, %r45; | |
add.s32 %r46, %r88, 2; | |
cvt.u64.u32 %rd9, %r46; | |
shr.u32 %r47, %r21, 1; | |
mul.wide.u32 %rd41, %r47, 4; | |
add.s64 %rd10, %rd36, %rd41; | |
cvt.u64.u32 %rd42, %r5; | |
add.s64 %rd43, %rd42, %rd39; | |
shl.b64 %rd44, %rd43, 2; | |
add.s64 %rd45, %rd44, %rd35; | |
add.s64 %rd11, %rd45, 4; | |
add.s64 %rd12, %rd10, 4; | |
shl.b64 %rd46, %rd4, 18; | |
add.s64 %rd47, %rd37, %rd46; | |
BB2_4: | |
mov.u16 %rs3, 0; | |
st.local.v4.u8 [%rd1], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd1+4], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd1+8], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd1+12], {%rs3, %rs3, %rs3, %rs3}; | |
and.b64 %rd15, %rd105, 4294967295; | |
shl.b64 %rd48, %rd15, 2; | |
add.s64 %rd49, %rd47, %rd48; | |
ld.global.u32 %r48, [%rd49]; | |
mov.u32 %r49, 64; | |
min.u32 %r10, %r48, %r49; | |
mov.u32 %r90, 0; | |
st.global.u32 [%rd49], %r90; | |
setp.eq.s32 %p3, %r10, 0; | |
@%p3 bra BB2_16; | |
cvt.u32.u64 %r52, %rd105; | |
mul.wide.u32 %rd50, %r52, 448; | |
shl.b64 %rd51, %rd50, 2; | |
add.s64 %rd16, %rd11, %rd51; | |
BB2_6: | |
cvt.u64.u32 %rd17, %r90; | |
mul.lo.s64 %rd52, %rd15, 1792; | |
add.s64 %rd53, %rd3, %rd52; | |
mul.wide.u32 %rd54, %r90, 28; | |
add.s64 %rd55, %rd53, %rd54; | |
ld.global.u32 %r53, [%rd55]; | |
shr.u32 %r54, %r53, 28; | |
cvt.u64.u32 %rd18, %r54; | |
add.s64 %rd56, %rd1, %rd18; | |
ld.local.u8 %rs1, [%rd56]; | |
add.s16 %rs4, %rs1, 1; | |
st.local.u8 [%rd56], %rs4; | |
cvt.u32.u16 %r55, %rs1; | |
st.local.u32 [%rd1+284], %r55; | |
setp.gt.u16 %p4, %rs1, 15; | |
@%p4 bra BB2_15; | |
add.u64 %rd103, %SP, 0; | |
cvt.u64.u16 %rd57, %rs1; | |
shl.b64 %rd58, %rd18, 4; | |
add.s64 %rd60, %rd103, %rd58; | |
add.s64 %rd61, %rd60, 16; | |
st.local.u64 [%rd1+272], %rd61; | |
add.s64 %rd62, %rd1, %rd58; | |
add.s64 %rd63, %rd62, %rd57; | |
st.local.u8 [%rd63+16], %r90; | |
mov.u32 %r91, 0; | |
st.local.u32 [%rd1+280], %r91; | |
ld.local.u32 %r57, [%rd1+284]; | |
setp.eq.s32 %p5, %r57, 0; | |
@%p5 bra BB2_15; | |
mul.wide.s32 %rd64, %r90, 7; | |
shl.b64 %rd65, %rd64, 2; | |
add.s64 %rd19, %rd16, %rd65; | |
mul.lo.s64 %rd68, %rd17, 28; | |
add.s64 %rd69, %rd53, %rd68; | |
add.s64 %rd70, %rd69, 4; | |
shl.b64 %rd71, %rd6, 2; | |
add.s64 %rd20, %rd70, %rd71; | |
add.s64 %rd21, %rd70, %rd7; | |
add.s64 %rd22, %rd70, %rd8; | |
add.s64 %rd23, %rd70, %rd9; | |
shl.b32 %r59, %r90, 22; | |
or.b32 %r12, %r59, %r89; | |
BB2_9: | |
mov.u32 %r13, %r91; | |
add.s32 %r60, %r13, 1; | |
st.local.u32 [%rd1+280], %r60; | |
ld.local.u64 %rd72, [%rd1+272]; | |
cvt.u64.u32 %rd73, %r13; | |
add.s64 %rd74, %rd72, %rd73; | |
ld.u8 %rs2, [%rd74]; | |
cvt.u64.u16 %rd75, %rs2; | |
and.b64 %rd24, %rd75, 255; | |
cvt.u32.u16 %r61, %rs2; | |
and.b32 %r62, %r61, 255; | |
mul.wide.u32 %rd78, %r62, 28; | |
add.s64 %rd79, %rd53, %rd78; | |
add.s64 %rd81, %rd79, %rd71; | |
ld.global.u32 %r63, [%rd20]; | |
ld.global.u32 %r64, [%rd81+4]; | |
setp.eq.s32 %p6, %r64, %r63; | |
@%p6 bra BB2_14; | |
ld.param.u64 %rd104, [digitOdd_param_3]; | |
mul.lo.s64 %rd84, %rd24, 28; | |
add.s64 %rd85, %rd53, %rd84; | |
add.s64 %rd86, %rd85, 4; | |
add.s64 %rd87, %rd86, %rd7; | |
ld.global.u8 %rs5, [%rd21]; | |
ld.global.u8 %rs6, [%rd87]; | |
xor.b16 %rs7, %rs5, %rs6; | |
cvt.u32.u16 %r65, %rs7; | |
and.b32 %r66, %r65, 15; | |
add.s64 %rd88, %rd86, %rd8; | |
ld.global.u8 %rs8, [%rd22]; | |
ld.global.u8 %rs9, [%rd88]; | |
xor.b16 %rs10, %rs8, %rs9; | |
cvt.u32.u16 %r67, %rs10; | |
bfi.b32 %r68, %r66, %r67, 8, 24; | |
shl.b32 %r69, %r68, 4; | |
add.s64 %rd89, %rd86, %rd9; | |
ld.global.u8 %rs11, [%rd23]; | |
ld.global.u8 %rs12, [%rd89]; | |
xor.b16 %rs13, %rs11, %rs12; | |
cvt.u32.u16 %r70, %rs13; | |
and.b32 %r14, %r70, 255; | |
bfe.u32 %r71, %r70, 4, 4; | |
or.b32 %r72, %r71, %r69; | |
cvt.u64.u32 %rd25, %r72; | |
mul.wide.u32 %rd90, %r72, 4; | |
add.s64 %rd91, %rd104, %rd90; | |
add.s64 %rd92, %rd91, 262144; | |
atom.global.add.u32 %r15, [%rd92], 1; | |
setp.gt.u32 %p7, %r15, 63; | |
@%p7 bra BB2_14; | |
shl.b32 %r75, %r62, 16; | |
or.b32 %r76, %r12, %r75; | |
shl.b32 %r77, %r14, 28; | |
or.b32 %r78, %r76, %r77; | |
mul.lo.s64 %rd93, %rd25, 1792; | |
add.s64 %rd94, %rd10, %rd93; | |
mul.wide.u32 %rd95, %r15, 28; | |
add.s64 %rd96, %rd94, %rd95; | |
st.global.u32 [%rd96], %r78; | |
setp.ge.u32 %p8, %r5, %r87; | |
@%p8 bra BB2_14; | |
cvt.u32.u64 %r79, %rd25; | |
mul.lo.s64 %rd97, %rd24, 7; | |
shl.b64 %rd98, %rd97, 2; | |
add.s64 %rd107, %rd16, %rd98; | |
mul.wide.u32 %rd99, %r79, 448; | |
mul.wide.u32 %rd100, %r15, 7; | |
add.s64 %rd101, %rd99, %rd100; | |
shl.b64 %rd102, %rd101, 2; | |
add.s64 %rd106, %rd12, %rd102; | |
mov.u64 %rd108, %rd19; | |
mov.u32 %r93, %r5; | |
BB2_13: | |
mov.u32 %r16, %r93; | |
mov.u64 %rd30, %rd108; | |
ld.global.u32 %r80, [%rd30]; | |
ld.global.u32 %r81, [%rd107]; | |
xor.b32 %r82, %r80, %r81; | |
st.global.u32 [%rd106], %r82; | |
add.s64 %rd31, %rd30, 4; | |
add.s64 %rd107, %rd107, 4; | |
add.s64 %rd106, %rd106, 4; | |
add.s32 %r17, %r16, 1; | |
setp.lt.u32 %p9, %r17, %r87; | |
mov.u64 %rd108, %rd31; | |
mov.u32 %r93, %r17; | |
@%p9 bra BB2_13; | |
BB2_14: | |
ld.local.v2.u32 {%r83, %r84}, [%rd1+280]; | |
mov.u32 %r91, %r83; | |
setp.lt.u32 %p10, %r83, %r84; | |
@%p10 bra BB2_9; | |
BB2_15: | |
cvt.u32.u64 %r86, %rd17; | |
add.s32 %r90, %r86, 1; | |
setp.lt.u32 %p11, %r90, %r10; | |
@%p11 bra BB2_6; | |
BB2_16: | |
add.s64 %rd105, %rd5, %rd15; | |
cvt.u32.u64 %r89, %rd105; | |
setp.lt.u32 %p12, %r89, 65536; | |
@%p12 bra BB2_4; | |
BB2_17: | |
ret; | |
} | |
// .globl digitEven | |
.entry digitEven( | |
.param .u32 digitEven_param_0, | |
.param .u64 .ptr .global .align 4 digitEven_param_1, | |
.param .u64 .ptr .global .align 4 digitEven_param_2, | |
.param .u64 .ptr .global .align 4 digitEven_param_3 | |
) | |
{ | |
.local .align 8 .b8 __local_depot3[296]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<13>; | |
.reg .b16 %rs<15>; | |
.reg .b32 %r<88>; | |
.reg .b64 %rd<112>; | |
mov.u64 %rd111, __local_depot3; | |
cvta.local.u64 %SP, %rd111; | |
ld.param.u32 %r21, [digitEven_param_0]; | |
ld.param.u64 %rd35, [digitEven_param_1]; | |
ld.param.u64 %rd36, [digitEven_param_2]; | |
ld.param.u64 %rd37, [digitEven_param_3]; | |
add.u64 %rd38, %SP, 0; | |
cvta.to.local.u64 %rd1, %rd38; | |
setp.eq.s32 %p1, %r21, 0; | |
mov.u32 %r81, 0; | |
mov.u32 %r87, %r81; | |
mov.u32 %r80, %r81; | |
@%p1 bra BB3_2; | |
mul.lo.s32 %r25, %r21, -20; | |
add.s32 %r26, %r25, 187; | |
shr.u32 %r27, %r26, 3; | |
add.s32 %r28, %r27, 3; | |
shr.u32 %r29, %r28, 2; | |
add.s32 %r30, %r25, 207; | |
shr.u32 %r31, %r30, 3; | |
add.s32 %r32, %r31, 3; | |
shr.u32 %r80, %r32, 2; | |
shl.b32 %r33, %r80, 2; | |
sub.s32 %r81, %r33, %r31; | |
sub.s32 %r87, %r80, %r29; | |
BB3_2: | |
mov.u32 %r5, %r87; | |
mov.u32 %r34, %ctaid.x; | |
mov.u32 %r7, %ntid.x; | |
mov.b32 %r35, %envreg3; | |
mad.lo.s32 %r36, %r34, %r7, %r35; | |
mov.u32 %r37, %tid.x; | |
add.s32 %r82, %r36, %r37; | |
setp.gt.u32 %p2, %r82, 65535; | |
@%p2 bra BB3_17; | |
cvt.s64.s32 %rd107, %r82; | |
not.b32 %r38, %r21; | |
add.s32 %r39, %r21, -1; | |
shr.u32 %r40, %r39, 1; | |
cvt.u64.u32 %rd39, %r40; | |
mul.wide.u32 %rd40, %r40, 4; | |
add.s64 %rd3, %rd36, %rd40; | |
and.b32 %r41, %r38, 1; | |
cvt.u64.u32 %rd4, %r41; | |
mov.b32 %r42, %envreg6; | |
mul.lo.s32 %r43, %r7, %r42; | |
cvt.s64.s32 %rd5, %r43; | |
add.s32 %r44, %r80, -1; | |
cvt.u64.u32 %rd6, %r44; | |
cvt.u64.u32 %rd7, %r81; | |
add.s32 %r45, %r81, 1; | |
cvt.u64.u32 %rd8, %r45; | |
add.s32 %r46, %r81, 2; | |
cvt.u64.u32 %rd9, %r46; | |
shr.u32 %r47, %r21, 1; | |
mul.wide.u32 %rd41, %r47, 4; | |
add.s64 %rd10, %rd35, %rd41; | |
cvt.u64.u32 %rd42, %r5; | |
add.s64 %rd43, %rd42, %rd39; | |
shl.b64 %rd44, %rd43, 2; | |
add.s64 %rd45, %rd44, %rd36; | |
add.s64 %rd11, %rd45, 4; | |
add.s64 %rd12, %rd10, 4; | |
shl.b64 %rd46, %rd4, 18; | |
add.s64 %rd47, %rd37, %rd46; | |
BB3_4: | |
mov.u16 %rs4, 0; | |
st.local.v4.u8 [%rd1], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd1+4], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd1+8], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd1+12], {%rs4, %rs4, %rs4, %rs4}; | |
and.b64 %rd15, %rd107, 4294967295; | |
shl.b64 %rd48, %rd15, 2; | |
add.s64 %rd49, %rd47, %rd48; | |
ld.global.u32 %r48, [%rd49]; | |
mov.u32 %r49, 64; | |
min.u32 %r10, %r48, %r49; | |
mov.u32 %r83, 0; | |
st.global.u32 [%rd49], %r83; | |
setp.eq.s32 %p3, %r10, 0; | |
@%p3 bra BB3_16; | |
cvt.u32.u64 %r52, %rd107; | |
mul.wide.u32 %rd50, %r52, 448; | |
shl.b64 %rd51, %rd50, 2; | |
add.s64 %rd16, %rd11, %rd51; | |
BB3_6: | |
cvt.u64.u32 %rd17, %r83; | |
mul.lo.s64 %rd52, %rd15, 1792; | |
add.s64 %rd53, %rd3, %rd52; | |
mul.wide.u32 %rd54, %r83, 28; | |
add.s64 %rd55, %rd53, %rd54; | |
ld.global.u32 %r53, [%rd55]; | |
shr.u32 %r54, %r53, 28; | |
cvt.u64.u32 %rd18, %r54; | |
add.s64 %rd56, %rd1, %rd18; | |
ld.local.u8 %rs1, [%rd56]; | |
add.s16 %rs5, %rs1, 1; | |
st.local.u8 [%rd56], %rs5; | |
cvt.u32.u16 %r55, %rs1; | |
st.local.u32 [%rd1+284], %r55; | |
setp.gt.u16 %p4, %rs1, 15; | |
@%p4 bra BB3_15; | |
add.u64 %rd105, %SP, 0; | |
cvt.u64.u16 %rd57, %rs1; | |
shl.b64 %rd58, %rd18, 4; | |
add.s64 %rd60, %rd105, %rd58; | |
add.s64 %rd61, %rd60, 16; | |
st.local.u64 [%rd1+272], %rd61; | |
add.s64 %rd62, %rd1, %rd58; | |
add.s64 %rd63, %rd62, %rd57; | |
st.local.u8 [%rd63+16], %r83; | |
mov.u32 %r84, 0; | |
st.local.u32 [%rd1+280], %r84; | |
ld.local.u32 %r57, [%rd1+284]; | |
setp.eq.s32 %p5, %r57, 0; | |
@%p5 bra BB3_15; | |
mul.wide.s32 %rd64, %r83, 7; | |
shl.b64 %rd65, %rd64, 2; | |
add.s64 %rd19, %rd16, %rd65; | |
mul.lo.s64 %rd68, %rd17, 28; | |
add.s64 %rd69, %rd53, %rd68; | |
add.s64 %rd70, %rd69, 4; | |
shl.b64 %rd71, %rd6, 2; | |
add.s64 %rd20, %rd70, %rd71; | |
add.s64 %rd21, %rd70, %rd7; | |
add.s64 %rd22, %rd70, %rd8; | |
add.s64 %rd23, %rd70, %rd9; | |
shl.b32 %r59, %r83, 22; | |
or.b32 %r12, %r59, %r82; | |
BB3_9: | |
mov.u32 %r13, %r84; | |
add.s32 %r60, %r13, 1; | |
st.local.u32 [%rd1+280], %r60; | |
ld.local.u64 %rd72, [%rd1+272]; | |
cvt.u64.u32 %rd73, %r13; | |
add.s64 %rd74, %rd72, %rd73; | |
ld.u8 %rs2, [%rd74]; | |
cvt.u64.u16 %rd75, %rs2; | |
and.b64 %rd24, %rd75, 255; | |
cvt.u32.u16 %r61, %rs2; | |
and.b32 %r62, %r61, 255; | |
mul.wide.u32 %rd78, %r62, 28; | |
add.s64 %rd79, %rd53, %rd78; | |
add.s64 %rd81, %rd79, %rd71; | |
ld.global.u32 %r63, [%rd20]; | |
ld.global.u32 %r64, [%rd81+4]; | |
setp.eq.s32 %p6, %r64, %r63; | |
@%p6 bra BB3_14; | |
ld.param.u64 %rd106, [digitEven_param_3]; | |
mul.lo.s64 %rd84, %rd24, 28; | |
add.s64 %rd85, %rd53, %rd84; | |
add.s64 %rd86, %rd85, 4; | |
add.s64 %rd87, %rd86, %rd7; | |
ld.global.u8 %rs6, [%rd21]; | |
ld.global.u8 %rs7, [%rd87]; | |
xor.b16 %rs8, %rs6, %rs7; | |
cvt.u32.u16 %r66, %rs8; | |
and.b32 %r67, %r66, 255; | |
mul.wide.u32 %rd88, %r67, 256; | |
add.s64 %rd89, %rd86, %rd8; | |
ld.global.u8 %rs9, [%rd22]; | |
ld.global.u8 %rs10, [%rd89]; | |
xor.b16 %rs11, %rs9, %rs10; | |
cvt.u64.u16 %rd90, %rs11; | |
and.b64 %rd91, %rd90, 255; | |
or.b64 %rd25, %rd91, %rd88; | |
add.s64 %rd92, %rd86, %rd9; | |
ld.global.u8 %rs12, [%rd23]; | |
ld.global.u8 %rs13, [%rd92]; | |
xor.b16 %rs3, %rs12, %rs13; | |
shl.b64 %rd93, %rd25, 2; | |
add.s64 %rd94, %rd106, %rd93; | |
atom.global.add.u32 %r15, [%rd94], 1; | |
setp.gt.u32 %p7, %r15, 63; | |
@%p7 bra BB3_14; | |
shr.u16 %rs14, %rs3, 4; | |
cvt.u32.u16 %r68, %rs14; | |
shl.b32 %r69, %r68, 28; | |
shl.b32 %r70, %r62, 16; | |
or.b32 %r71, %r12, %r70; | |
or.b32 %r72, %r71, %r69; | |
mul.lo.s64 %rd95, %rd25, 1792; | |
add.s64 %rd96, %rd10, %rd95; | |
mul.wide.u32 %rd97, %r15, 28; | |
add.s64 %rd98, %rd96, %rd97; | |
st.global.u32 [%rd98], %r72; | |
setp.ge.u32 %p8, %r5, %r80; | |
@%p8 bra BB3_14; | |
mul.lo.s64 %rd99, %rd24, 7; | |
shl.b64 %rd100, %rd99, 2; | |
add.s64 %rd109, %rd16, %rd100; | |
mul.wide.u32 %rd101, %r15, 7; | |
mul.lo.s64 %rd102, %rd25, 448; | |
add.s64 %rd103, %rd102, %rd101; | |
shl.b64 %rd104, %rd103, 2; | |
add.s64 %rd108, %rd12, %rd104; | |
mov.u64 %rd110, %rd19; | |
mov.u32 %r86, %r5; | |
BB3_13: | |
mov.u32 %r16, %r86; | |
mov.u64 %rd30, %rd110; | |
ld.global.u32 %r73, [%rd30]; | |
ld.global.u32 %r74, [%rd109]; | |
xor.b32 %r75, %r73, %r74; | |
st.global.u32 [%rd108], %r75; | |
add.s64 %rd31, %rd30, 4; | |
add.s64 %rd109, %rd109, 4; | |
add.s64 %rd108, %rd108, 4; | |
add.s32 %r17, %r16, 1; | |
setp.lt.u32 %p9, %r17, %r80; | |
mov.u64 %rd110, %rd31; | |
mov.u32 %r86, %r17; | |
@%p9 bra BB3_13; | |
BB3_14: | |
ld.local.v2.u32 {%r76, %r77}, [%rd1+280]; | |
mov.u32 %r84, %r76; | |
setp.lt.u32 %p10, %r76, %r77; | |
@%p10 bra BB3_9; | |
BB3_15: | |
cvt.u32.u64 %r79, %rd17; | |
add.s32 %r83, %r79, 1; | |
setp.lt.u32 %p11, %r83, %r10; | |
@%p11 bra BB3_6; | |
BB3_16: | |
add.s64 %rd107, %rd5, %rd15; | |
cvt.u32.u64 %r82, %rd107; | |
setp.lt.u32 %p12, %r82, 65536; | |
@%p12 bra BB3_4; | |
BB3_17: | |
ret; | |
} | |
// .globl digit_1 | |
.entry digit_1( | |
.param .u64 .ptr .global .align 4 digit_1_param_0, | |
.param .u64 .ptr .global .align 4 digit_1_param_1, | |
.param .u64 .ptr .global .align 4 digit_1_param_2 | |
) | |
{ | |
.local .align 8 .b8 __local_depot4[296]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<10>; | |
.reg .b16 %rs<14>; | |
.reg .b32 %r<70>; | |
.reg .b64 %rd<53>; | |
mov.u64 %rd52, __local_depot4; | |
cvta.local.u64 %SP, %rd52; | |
ld.param.u64 %rd12, [digit_1_param_0]; | |
ld.param.u64 %rd13, [digit_1_param_1]; | |
ld.param.u64 %rd14, [digit_1_param_2]; | |
mov.u32 %r13, %ctaid.x; | |
mov.u32 %r1, %ntid.x; | |
mov.b32 %r14, %envreg3; | |
mad.lo.s32 %r15, %r13, %r1, %r14; | |
mov.u32 %r16, %tid.x; | |
add.s32 %r67, %r15, %r16; | |
setp.gt.u32 %p1, %r67, 65535; | |
@%p1 bra BB4_12; | |
cvt.s64.s32 %rd51, %r67; | |
mov.b32 %r17, %envreg6; | |
mul.lo.s32 %r18, %r1, %r17; | |
cvt.s64.s32 %rd2, %r18; | |
BB4_2: | |
mov.u64 %rd3, %rd51; | |
add.u64 %rd15, %SP, 0; | |
cvta.to.local.u64 %rd16, %rd15; | |
mov.u16 %rs3, 0; | |
st.local.v4.u8 [%rd16], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd16+4], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd16+8], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd16+12], {%rs3, %rs3, %rs3, %rs3}; | |
and.b64 %rd4, %rd3, 4294967295; | |
shl.b64 %rd17, %rd4, 2; | |
add.s64 %rd18, %rd14, %rd17; | |
ld.global.u32 %r20, [%rd18]; | |
mov.u32 %r21, 64; | |
min.u32 %r4, %r20, %r21; | |
mov.u32 %r68, 0; | |
st.global.u32 [%rd18], %r68; | |
setp.eq.s32 %p2, %r4, 0; | |
@%p2 bra BB4_11; | |
BB4_3: | |
cvt.u64.u32 %rd5, %r68; | |
mul.lo.s64 %rd21, %rd4, 1792; | |
add.s64 %rd22, %rd12, %rd21; | |
mul.wide.u32 %rd23, %r68, 28; | |
add.s64 %rd6, %rd22, %rd23; | |
ld.global.u32 %r22, [%rd6]; | |
shr.u32 %r23, %r22, 28; | |
cvt.u64.u32 %rd7, %r23; | |
add.s64 %rd24, %rd16, %rd7; | |
ld.local.u8 %rs1, [%rd24]; | |
add.s16 %rs4, %rs1, 1; | |
st.local.u8 [%rd24], %rs4; | |
cvt.u32.u16 %r24, %rs1; | |
st.local.u32 [%rd16+284], %r24; | |
setp.gt.u16 %p3, %rs1, 15; | |
@%p3 bra BB4_10; | |
cvt.u64.u16 %rd25, %rs1; | |
shl.b64 %rd26, %rd7, 4; | |
add.s64 %rd28, %rd15, %rd26; | |
add.s64 %rd29, %rd28, 16; | |
st.local.u64 [%rd16+272], %rd29; | |
add.s64 %rd31, %rd16, %rd26; | |
add.s64 %rd32, %rd31, %rd25; | |
st.local.u8 [%rd32+16], %r68; | |
mov.u32 %r69, 0; | |
st.local.u32 [%rd16+280], %r69; | |
ld.local.u32 %r26, [%rd16+284]; | |
setp.eq.s32 %p4, %r26, 0; | |
@%p4 bra BB4_10; | |
shl.b32 %r28, %r68, 22; | |
or.b32 %r6, %r28, %r67; | |
add.s64 %rd8, %rd6, 4; | |
BB4_6: | |
mov.u32 %r7, %r69; | |
add.s32 %r29, %r7, 1; | |
st.local.u32 [%rd16+280], %r29; | |
ld.local.u64 %rd35, [%rd16+272]; | |
cvt.u64.u32 %rd36, %r7; | |
add.s64 %rd37, %rd35, %rd36; | |
ld.u8 %rs2, [%rd37]; | |
cvt.u32.u16 %r30, %rs2; | |
and.b32 %r31, %r30, 255; | |
mul.wide.u32 %rd40, %r31, 28; | |
add.s64 %rd41, %rd22, %rd40; | |
add.s64 %rd9, %rd41, 24; | |
ld.global.u32 %r32, [%rd6+24]; | |
ld.global.u32 %r33, [%rd41+24]; | |
setp.eq.s32 %p5, %r33, %r32; | |
@%p5 bra BB4_9; | |
ld.global.u8 %rs5, [%rd8+1]; | |
ld.global.u8 %rs6, [%rd9+-19]; | |
xor.b16 %rs7, %rs5, %rs6; | |
cvt.u32.u16 %r34, %rs7; | |
and.b32 %r35, %r34, 15; | |
ld.global.u8 %rs8, [%rd8+2]; | |
ld.global.u8 %rs9, [%rd9+-18]; | |
xor.b16 %rs10, %rs8, %rs9; | |
cvt.u32.u16 %r36, %rs10; | |
bfi.b32 %r37, %r35, %r36, 8, 24; | |
shl.b32 %r38, %r37, 4; | |
ld.global.u8 %rs11, [%rd8+3]; | |
ld.global.u8 %rs12, [%rd9+-17]; | |
xor.b16 %rs13, %rs11, %rs12; | |
cvt.u32.u16 %r39, %rs13; | |
and.b32 %r8, %r39, 255; | |
bfe.u32 %r40, %r39, 4, 4; | |
or.b32 %r41, %r40, %r38; | |
cvt.u64.u32 %rd10, %r41; | |
mul.wide.u32 %rd42, %r41, 4; | |
add.s64 %rd43, %rd14, %rd42; | |
add.s64 %rd44, %rd43, 262144; | |
atom.global.add.u32 %r9, [%rd44], 1; | |
setp.gt.u32 %p6, %r9, 63; | |
@%p6 bra BB4_9; | |
shl.b32 %r44, %r31, 16; | |
or.b32 %r45, %r6, %r44; | |
shl.b32 %r46, %r8, 28; | |
or.b32 %r47, %r45, %r46; | |
mul.lo.s64 %rd45, %rd10, 1792; | |
add.s64 %rd46, %rd13, %rd45; | |
mul.wide.u32 %rd47, %r9, 28; | |
add.s64 %rd48, %rd46, %rd47; | |
st.global.u32 [%rd48], %r47; | |
ld.global.u32 %r48, [%rd6+8]; | |
ld.global.u32 %r49, [%rd9+-16]; | |
xor.b32 %r50, %r48, %r49; | |
st.global.u32 [%rd48+4], %r50; | |
ld.global.u32 %r51, [%rd6+12]; | |
ld.global.u32 %r52, [%rd9+-12]; | |
xor.b32 %r53, %r51, %r52; | |
st.global.u32 [%rd48+8], %r53; | |
ld.global.u32 %r54, [%rd6+16]; | |
ld.global.u32 %r55, [%rd9+-8]; | |
xor.b32 %r56, %r54, %r55; | |
st.global.u32 [%rd48+12], %r56; | |
ld.global.u32 %r57, [%rd6+20]; | |
ld.global.u32 %r58, [%rd9+-4]; | |
xor.b32 %r59, %r57, %r58; | |
st.global.u32 [%rd48+16], %r59; | |
ld.global.u32 %r60, [%rd6+24]; | |
ld.global.u32 %r61, [%rd9]; | |
xor.b32 %r62, %r60, %r61; | |
st.global.u32 [%rd48+20], %r62; | |
BB4_9: | |
ld.local.v2.u32 {%r63, %r64}, [%rd16+280]; | |
mov.u32 %r69, %r63; | |
setp.lt.u32 %p7, %r63, %r64; | |
@%p7 bra BB4_6; | |
BB4_10: | |
cvt.u32.u64 %r66, %rd5; | |
add.s32 %r68, %r66, 1; | |
setp.lt.u32 %p8, %r68, %r4; | |
@%p8 bra BB4_3; | |
BB4_11: | |
add.s64 %rd51, %rd2, %rd4; | |
cvt.u32.u64 %r67, %rd51; | |
setp.lt.u32 %p9, %r67, 65536; | |
@%p9 bra BB4_2; | |
BB4_12: | |
ret; | |
} | |
// .globl digit_2 | |
.entry digit_2( | |
.param .u64 .ptr .global .align 4 digit_2_param_0, | |
.param .u64 .ptr .global .align 4 digit_2_param_1, | |
.param .u64 .ptr .global .align 4 digit_2_param_2 | |
) | |
{ | |
.local .align 8 .b8 __local_depot5[296]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<10>; | |
.reg .b16 %rs<15>; | |
.reg .b32 %r<64>; | |
.reg .b64 %rd<54>; | |
mov.u64 %rd53, __local_depot5; | |
cvta.local.u64 %SP, %rd53; | |
ld.param.u64 %rd11, [digit_2_param_0]; | |
ld.param.u64 %rd12, [digit_2_param_1]; | |
ld.param.u64 %rd13, [digit_2_param_2]; | |
mov.u32 %r13, %ctaid.x; | |
mov.u32 %r1, %ntid.x; | |
mov.b32 %r14, %envreg3; | |
mad.lo.s32 %r15, %r13, %r1, %r14; | |
mov.u32 %r16, %tid.x; | |
add.s32 %r61, %r15, %r16; | |
setp.gt.u32 %p1, %r61, 65535; | |
@%p1 bra BB5_12; | |
cvt.s64.s32 %rd52, %r61; | |
mov.b32 %r17, %envreg6; | |
mul.lo.s32 %r18, %r1, %r17; | |
cvt.s64.s32 %rd2, %r18; | |
BB5_2: | |
mov.u64 %rd3, %rd52; | |
add.u64 %rd14, %SP, 0; | |
cvta.to.local.u64 %rd15, %rd14; | |
mov.u16 %rs4, 0; | |
st.local.v4.u8 [%rd15], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd15+4], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd15+8], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd15+12], {%rs4, %rs4, %rs4, %rs4}; | |
and.b64 %rd4, %rd3, 4294967295; | |
shl.b64 %rd16, %rd4, 2; | |
add.s64 %rd17, %rd13, %rd16; | |
ld.global.u32 %r20, [%rd17+262144]; | |
mov.u32 %r21, 64; | |
min.u32 %r4, %r20, %r21; | |
mov.u32 %r62, 0; | |
st.global.u32 [%rd17+262144], %r62; | |
setp.eq.s32 %p2, %r4, 0; | |
@%p2 bra BB5_11; | |
BB5_3: | |
cvt.u64.u32 %rd5, %r62; | |
mul.lo.s64 %rd20, %rd4, 1792; | |
add.s64 %rd21, %rd12, %rd20; | |
mul.wide.u32 %rd22, %r62, 28; | |
add.s64 %rd6, %rd21, %rd22; | |
ld.global.u32 %r22, [%rd6]; | |
shr.u32 %r23, %r22, 28; | |
cvt.u64.u32 %rd7, %r23; | |
add.s64 %rd23, %rd15, %rd7; | |
ld.local.u8 %rs1, [%rd23]; | |
add.s16 %rs5, %rs1, 1; | |
st.local.u8 [%rd23], %rs5; | |
cvt.u32.u16 %r24, %rs1; | |
st.local.u32 [%rd15+284], %r24; | |
setp.gt.u16 %p3, %rs1, 15; | |
@%p3 bra BB5_10; | |
cvt.u64.u16 %rd24, %rs1; | |
shl.b64 %rd25, %rd7, 4; | |
add.s64 %rd27, %rd14, %rd25; | |
add.s64 %rd28, %rd27, 16; | |
st.local.u64 [%rd15+272], %rd28; | |
add.s64 %rd30, %rd15, %rd25; | |
add.s64 %rd31, %rd30, %rd24; | |
st.local.u8 [%rd31+16], %r62; | |
mov.u32 %r63, 0; | |
st.local.u32 [%rd15+280], %r63; | |
ld.local.u32 %r26, [%rd15+284]; | |
setp.eq.s32 %p4, %r26, 0; | |
@%p4 bra BB5_10; | |
shl.b32 %r28, %r62, 22; | |
or.b32 %r6, %r28, %r61; | |
BB5_6: | |
mov.u32 %r7, %r63; | |
add.s32 %r29, %r7, 1; | |
st.local.u32 [%rd15+280], %r29; | |
ld.local.u64 %rd34, [%rd15+272]; | |
cvt.u64.u32 %rd35, %r7; | |
add.s64 %rd36, %rd34, %rd35; | |
ld.u8 %rs2, [%rd36]; | |
cvt.u32.u16 %r30, %rs2; | |
and.b32 %r31, %r30, 255; | |
mul.wide.u32 %rd39, %r31, 28; | |
add.s64 %rd40, %rd21, %rd39; | |
add.s64 %rd8, %rd40, 20; | |
ld.global.u32 %r32, [%rd6+20]; | |
ld.global.u32 %r33, [%rd40+20]; | |
setp.eq.s32 %p5, %r33, %r32; | |
@%p5 bra BB5_9; | |
ld.global.u8 %rs6, [%rd6+4]; | |
ld.global.u8 %rs7, [%rd8+-16]; | |
xor.b16 %rs8, %rs6, %rs7; | |
cvt.u32.u16 %r35, %rs8; | |
and.b32 %r36, %r35, 255; | |
mul.wide.u32 %rd41, %r36, 256; | |
ld.global.u8 %rs9, [%rd6+5]; | |
ld.global.u8 %rs10, [%rd8+-15]; | |
xor.b16 %rs11, %rs9, %rs10; | |
cvt.u64.u16 %rd42, %rs11; | |
and.b64 %rd43, %rd42, 255; | |
or.b64 %rd9, %rd43, %rd41; | |
ld.global.u8 %rs12, [%rd6+6]; | |
ld.global.u8 %rs13, [%rd8+-14]; | |
xor.b16 %rs3, %rs12, %rs13; | |
shl.b64 %rd44, %rd9, 2; | |
add.s64 %rd45, %rd13, %rd44; | |
atom.global.add.u32 %r9, [%rd45], 1; | |
setp.gt.u32 %p6, %r9, 63; | |
@%p6 bra BB5_9; | |
mul.lo.s64 %rd46, %rd9, 1792; | |
add.s64 %rd47, %rd11, %rd46; | |
shr.u16 %rs14, %rs3, 4; | |
cvt.u32.u16 %r37, %rs14; | |
shl.b32 %r38, %r37, 28; | |
shl.b32 %r39, %r31, 16; | |
or.b32 %r40, %r6, %r39; | |
or.b32 %r41, %r40, %r38; | |
mul.wide.u32 %rd48, %r9, 28; | |
add.s64 %rd49, %rd47, %rd48; | |
st.global.u32 [%rd49+4], %r41; | |
ld.global.u32 %r42, [%rd6+4]; | |
ld.global.u32 %r43, [%rd8+-16]; | |
xor.b32 %r44, %r42, %r43; | |
st.global.u32 [%rd49+8], %r44; | |
ld.global.u32 %r45, [%rd6+8]; | |
ld.global.u32 %r46, [%rd8+-12]; | |
xor.b32 %r47, %r45, %r46; | |
st.global.u32 [%rd49+12], %r47; | |
ld.global.u32 %r48, [%rd6+12]; | |
ld.global.u32 %r49, [%rd8+-8]; | |
xor.b32 %r50, %r48, %r49; | |
st.global.u32 [%rd49+16], %r50; | |
ld.global.u32 %r51, [%rd6+16]; | |
ld.global.u32 %r52, [%rd8+-4]; | |
xor.b32 %r53, %r51, %r52; | |
st.global.u32 [%rd49+20], %r53; | |
ld.global.u32 %r54, [%rd6+20]; | |
ld.global.u32 %r55, [%rd8]; | |
xor.b32 %r56, %r54, %r55; | |
st.global.u32 [%rd49+24], %r56; | |
BB5_9: | |
ld.local.v2.u32 {%r57, %r58}, [%rd15+280]; | |
mov.u32 %r63, %r57; | |
setp.lt.u32 %p7, %r57, %r58; | |
@%p7 bra BB5_6; | |
BB5_10: | |
cvt.u32.u64 %r60, %rd5; | |
add.s32 %r62, %r60, 1; | |
setp.lt.u32 %p8, %r62, %r4; | |
@%p8 bra BB5_3; | |
BB5_11: | |
add.s64 %rd52, %rd2, %rd4; | |
cvt.u32.u64 %r61, %rd52; | |
setp.lt.u32 %p9, %r61, 65536; | |
@%p9 bra BB5_2; | |
BB5_12: | |
ret; | |
} | |
// .globl digit_3 | |
.entry digit_3( | |
.param .u64 .ptr .global .align 4 digit_3_param_0, | |
.param .u64 .ptr .global .align 4 digit_3_param_1, | |
.param .u64 .ptr .global .align 4 digit_3_param_2 | |
) | |
{ | |
.local .align 8 .b8 __local_depot6[296]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<10>; | |
.reg .b16 %rs<14>; | |
.reg .b32 %r<67>; | |
.reg .b64 %rd<49>; | |
mov.u64 %rd48, __local_depot6; | |
cvta.local.u64 %SP, %rd48; | |
ld.param.u64 %rd16, [digit_3_param_0]; | |
ld.param.u64 %rd17, [digit_3_param_1]; | |
ld.param.u64 %rd18, [digit_3_param_2]; | |
add.u64 %rd19, %SP, 0; | |
cvta.to.local.u64 %rd1, %rd19; | |
mov.u32 %r13, %ctaid.x; | |
mov.u32 %r1, %ntid.x; | |
mov.b32 %r14, %envreg3; | |
mad.lo.s32 %r15, %r13, %r1, %r14; | |
mov.u32 %r16, %tid.x; | |
add.s32 %r64, %r15, %r16; | |
setp.gt.u32 %p1, %r64, 65535; | |
@%p1 bra BB6_12; | |
cvt.s64.s32 %rd47, %r64; | |
add.s64 %rd3, %rd16, 4; | |
mov.b32 %r17, %envreg6; | |
mul.lo.s32 %r18, %r1, %r17; | |
cvt.s64.s32 %rd4, %r18; | |
add.s64 %rd5, %rd17, 4; | |
BB6_2: | |
mov.u64 %rd6, %rd47; | |
mov.u16 %rs3, 0; | |
st.local.v4.u8 [%rd1], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd1+4], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd1+8], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd1+12], {%rs3, %rs3, %rs3, %rs3}; | |
and.b64 %rd8, %rd6, 4294967295; | |
shl.b64 %rd20, %rd8, 2; | |
add.s64 %rd21, %rd18, %rd20; | |
ld.global.u32 %r20, [%rd21]; | |
mov.u32 %r21, 64; | |
min.u32 %r4, %r20, %r21; | |
mov.u32 %r65, 0; | |
st.global.u32 [%rd21], %r65; | |
setp.eq.s32 %p2, %r4, 0; | |
@%p2 bra BB6_11; | |
BB6_3: | |
cvt.u64.u32 %rd9, %r65; | |
mul.lo.s64 %rd22, %rd8, 1792; | |
add.s64 %rd23, %rd3, %rd22; | |
mul.wide.u32 %rd24, %r65, 28; | |
add.s64 %rd10, %rd23, %rd24; | |
ld.global.u32 %r22, [%rd10]; | |
shr.u32 %r23, %r22, 28; | |
cvt.u64.u32 %rd11, %r23; | |
add.s64 %rd25, %rd1, %rd11; | |
ld.local.u8 %rs1, [%rd25]; | |
add.s16 %rs4, %rs1, 1; | |
st.local.u8 [%rd25], %rs4; | |
cvt.u32.u16 %r24, %rs1; | |
st.local.u32 [%rd1+284], %r24; | |
setp.gt.u16 %p3, %rs1, 15; | |
@%p3 bra BB6_10; | |
cvt.u64.u16 %rd26, %rs1; | |
shl.b64 %rd27, %rd11, 4; | |
add.s64 %rd29, %rd19, %rd27; | |
add.s64 %rd30, %rd29, 16; | |
st.local.u64 [%rd1+272], %rd30; | |
add.s64 %rd31, %rd1, %rd27; | |
add.s64 %rd32, %rd31, %rd26; | |
st.local.u8 [%rd32+16], %r65; | |
mov.u32 %r66, 0; | |
st.local.u32 [%rd1+280], %r66; | |
ld.local.u32 %r26, [%rd1+284]; | |
setp.eq.s32 %p4, %r26, 0; | |
@%p4 bra BB6_10; | |
shl.b32 %r28, %r65, 22; | |
or.b32 %r6, %r28, %r64; | |
add.s64 %rd12, %rd10, 4; | |
BB6_6: | |
mov.u32 %r7, %r66; | |
add.s32 %r29, %r7, 1; | |
st.local.u32 [%rd1+280], %r29; | |
ld.local.u64 %rd33, [%rd1+272]; | |
cvt.u64.u32 %rd34, %r7; | |
add.s64 %rd35, %rd33, %rd34; | |
ld.u8 %rs2, [%rd35]; | |
cvt.u32.u16 %r30, %rs2; | |
and.b32 %r31, %r30, 255; | |
mul.wide.u32 %rd38, %r31, 28; | |
add.s64 %rd39, %rd23, %rd38; | |
add.s64 %rd13, %rd39, 20; | |
ld.global.u32 %r32, [%rd10+20]; | |
ld.global.u32 %r33, [%rd39+20]; | |
setp.eq.s32 %p5, %r33, %r32; | |
@%p5 bra BB6_9; | |
ld.global.u8 %rs5, [%rd12+2]; | |
ld.global.u8 %rs6, [%rd13+-14]; | |
xor.b16 %rs7, %rs5, %rs6; | |
cvt.u32.u16 %r34, %rs7; | |
and.b32 %r35, %r34, 15; | |
ld.global.u8 %rs8, [%rd12+3]; | |
ld.global.u8 %rs9, [%rd13+-13]; | |
xor.b16 %rs10, %rs8, %rs9; | |
cvt.u32.u16 %r36, %rs10; | |
bfi.b32 %r37, %r35, %r36, 8, 24; | |
shl.b32 %r38, %r37, 4; | |
ld.global.u8 %rs11, [%rd12+4]; | |
ld.global.u8 %rs12, [%rd13+-12]; | |
xor.b16 %rs13, %rs11, %rs12; | |
cvt.u32.u16 %r39, %rs13; | |
and.b32 %r8, %r39, 255; | |
bfe.u32 %r40, %r39, 4, 4; | |
or.b32 %r41, %r40, %r38; | |
cvt.u64.u32 %rd14, %r41; | |
mul.wide.u32 %rd40, %r41, 4; | |
add.s64 %rd41, %rd18, %rd40; | |
add.s64 %rd42, %rd41, 262144; | |
atom.global.add.u32 %r9, [%rd42], 1; | |
setp.gt.u32 %p6, %r9, 63; | |
@%p6 bra BB6_9; | |
shl.b32 %r44, %r31, 16; | |
or.b32 %r45, %r6, %r44; | |
shl.b32 %r46, %r8, 28; | |
or.b32 %r47, %r45, %r46; | |
mul.lo.s64 %rd43, %rd14, 1792; | |
add.s64 %rd44, %rd5, %rd43; | |
mul.wide.u32 %rd45, %r9, 28; | |
add.s64 %rd46, %rd44, %rd45; | |
st.global.u32 [%rd46], %r47; | |
ld.global.u32 %r48, [%rd10+8]; | |
ld.global.u32 %r49, [%rd13+-12]; | |
xor.b32 %r50, %r48, %r49; | |
st.global.u32 [%rd46+4], %r50; | |
ld.global.u32 %r51, [%rd10+12]; | |
ld.global.u32 %r52, [%rd13+-8]; | |
xor.b32 %r53, %r51, %r52; | |
st.global.u32 [%rd46+8], %r53; | |
ld.global.u32 %r54, [%rd10+16]; | |
ld.global.u32 %r55, [%rd13+-4]; | |
xor.b32 %r56, %r54, %r55; | |
st.global.u32 [%rd46+12], %r56; | |
ld.global.u32 %r57, [%rd10+20]; | |
ld.global.u32 %r58, [%rd13]; | |
xor.b32 %r59, %r57, %r58; | |
st.global.u32 [%rd46+16], %r59; | |
BB6_9: | |
ld.local.v2.u32 {%r60, %r61}, [%rd1+280]; | |
mov.u32 %r66, %r60; | |
setp.lt.u32 %p7, %r60, %r61; | |
@%p7 bra BB6_6; | |
BB6_10: | |
cvt.u32.u64 %r63, %rd9; | |
add.s32 %r65, %r63, 1; | |
setp.lt.u32 %p8, %r65, %r4; | |
@%p8 bra BB6_3; | |
BB6_11: | |
add.s64 %rd47, %rd4, %rd8; | |
cvt.u32.u64 %r64, %rd47; | |
setp.lt.u32 %p9, %r64, 65536; | |
@%p9 bra BB6_2; | |
BB6_12: | |
ret; | |
} | |
// .globl digit_4 | |
.entry digit_4( | |
.param .u64 .ptr .global .align 4 digit_4_param_0, | |
.param .u64 .ptr .global .align 4 digit_4_param_1, | |
.param .u64 .ptr .global .align 4 digit_4_param_2 | |
) | |
{ | |
.local .align 8 .b8 __local_depot7[296]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<10>; | |
.reg .b16 %rs<15>; | |
.reg .b32 %r<61>; | |
.reg .b64 %rd<51>; | |
mov.u64 %rd50, __local_depot7; | |
cvta.local.u64 %SP, %rd50; | |
ld.param.u64 %rd16, [digit_4_param_0]; | |
ld.param.u64 %rd17, [digit_4_param_1]; | |
ld.param.u64 %rd18, [digit_4_param_2]; | |
add.u64 %rd19, %SP, 0; | |
cvta.to.local.u64 %rd1, %rd19; | |
mov.u32 %r13, %ctaid.x; | |
mov.u32 %r1, %ntid.x; | |
mov.b32 %r14, %envreg3; | |
mad.lo.s32 %r15, %r13, %r1, %r14; | |
mov.u32 %r16, %tid.x; | |
add.s32 %r58, %r15, %r16; | |
setp.gt.u32 %p1, %r58, 65535; | |
@%p1 bra BB7_12; | |
cvt.s64.s32 %rd49, %r58; | |
add.s64 %rd3, %rd17, 4; | |
mov.b32 %r17, %envreg6; | |
mul.lo.s32 %r18, %r1, %r17; | |
cvt.s64.s32 %rd4, %r18; | |
add.s64 %rd5, %rd16, 8; | |
BB7_2: | |
mov.u64 %rd6, %rd49; | |
mov.u16 %rs4, 0; | |
st.local.v4.u8 [%rd1], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd1+4], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd1+8], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd1+12], {%rs4, %rs4, %rs4, %rs4}; | |
and.b64 %rd8, %rd6, 4294967295; | |
shl.b64 %rd20, %rd8, 2; | |
add.s64 %rd21, %rd18, %rd20; | |
ld.global.u32 %r20, [%rd21+262144]; | |
mov.u32 %r21, 64; | |
min.u32 %r4, %r20, %r21; | |
mov.u32 %r59, 0; | |
st.global.u32 [%rd21+262144], %r59; | |
setp.eq.s32 %p2, %r4, 0; | |
@%p2 bra BB7_11; | |
BB7_3: | |
cvt.u64.u32 %rd9, %r59; | |
mul.lo.s64 %rd22, %rd8, 1792; | |
add.s64 %rd23, %rd3, %rd22; | |
mul.wide.u32 %rd24, %r59, 28; | |
add.s64 %rd10, %rd23, %rd24; | |
ld.global.u32 %r22, [%rd10]; | |
shr.u32 %r23, %r22, 28; | |
cvt.u64.u32 %rd11, %r23; | |
add.s64 %rd25, %rd1, %rd11; | |
ld.local.u8 %rs1, [%rd25]; | |
add.s16 %rs5, %rs1, 1; | |
st.local.u8 [%rd25], %rs5; | |
cvt.u32.u16 %r24, %rs1; | |
st.local.u32 [%rd1+284], %r24; | |
setp.gt.u16 %p3, %rs1, 15; | |
@%p3 bra BB7_10; | |
cvt.u64.u16 %rd26, %rs1; | |
shl.b64 %rd27, %rd11, 4; | |
add.s64 %rd29, %rd19, %rd27; | |
add.s64 %rd30, %rd29, 16; | |
st.local.u64 [%rd1+272], %rd30; | |
add.s64 %rd31, %rd1, %rd27; | |
add.s64 %rd32, %rd31, %rd26; | |
st.local.u8 [%rd32+16], %r59; | |
mov.u32 %r60, 0; | |
st.local.u32 [%rd1+280], %r60; | |
ld.local.u32 %r26, [%rd1+284]; | |
setp.eq.s32 %p4, %r26, 0; | |
@%p4 bra BB7_10; | |
shl.b32 %r28, %r59, 22; | |
or.b32 %r6, %r28, %r58; | |
add.s64 %rd12, %rd10, 4; | |
BB7_6: | |
mov.u32 %r7, %r60; | |
add.s32 %r29, %r7, 1; | |
st.local.u32 [%rd1+280], %r29; | |
ld.local.u64 %rd33, [%rd1+272]; | |
cvt.u64.u32 %rd34, %r7; | |
add.s64 %rd35, %rd33, %rd34; | |
ld.u8 %rs2, [%rd35]; | |
cvt.u32.u16 %r30, %rs2; | |
and.b32 %r31, %r30, 255; | |
mul.wide.u32 %rd38, %r31, 28; | |
add.s64 %rd39, %rd23, %rd38; | |
add.s64 %rd13, %rd39, 16; | |
ld.global.u32 %r32, [%rd10+16]; | |
ld.global.u32 %r33, [%rd39+16]; | |
setp.eq.s32 %p5, %r33, %r32; | |
@%p5 bra BB7_9; | |
ld.global.u8 %rs6, [%rd12+1]; | |
ld.global.u8 %rs7, [%rd13+-11]; | |
xor.b16 %rs8, %rs6, %rs7; | |
cvt.u32.u16 %r35, %rs8; | |
and.b32 %r36, %r35, 255; | |
mul.wide.u32 %rd40, %r36, 256; | |
ld.global.u8 %rs9, [%rd12+2]; | |
ld.global.u8 %rs10, [%rd13+-10]; | |
xor.b16 %rs11, %rs9, %rs10; | |
cvt.u64.u16 %rd41, %rs11; | |
and.b64 %rd42, %rd41, 255; | |
or.b64 %rd14, %rd42, %rd40; | |
ld.global.u8 %rs12, [%rd12+3]; | |
ld.global.u8 %rs13, [%rd13+-9]; | |
xor.b16 %rs3, %rs12, %rs13; | |
shl.b64 %rd43, %rd14, 2; | |
add.s64 %rd44, %rd18, %rd43; | |
atom.global.add.u32 %r9, [%rd44], 1; | |
setp.gt.u32 %p6, %r9, 63; | |
@%p6 bra BB7_9; | |
shr.u16 %rs14, %rs3, 4; | |
cvt.u32.u16 %r37, %rs14; | |
shl.b32 %r38, %r37, 28; | |
shl.b32 %r39, %r31, 16; | |
or.b32 %r40, %r6, %r39; | |
or.b32 %r41, %r40, %r38; | |
mul.lo.s64 %rd45, %rd14, 1792; | |
add.s64 %rd46, %rd5, %rd45; | |
mul.wide.u32 %rd47, %r9, 28; | |
add.s64 %rd48, %rd46, %rd47; | |
st.global.u32 [%rd48], %r41; | |
ld.global.u32 %r42, [%rd10+4]; | |
ld.global.u32 %r43, [%rd13+-12]; | |
xor.b32 %r44, %r42, %r43; | |
st.global.u32 [%rd48+4], %r44; | |
ld.global.u32 %r45, [%rd10+8]; | |
ld.global.u32 %r46, [%rd13+-8]; | |
xor.b32 %r47, %r45, %r46; | |
st.global.u32 [%rd48+8], %r47; | |
ld.global.u32 %r48, [%rd10+12]; | |
ld.global.u32 %r49, [%rd13+-4]; | |
xor.b32 %r50, %r48, %r49; | |
st.global.u32 [%rd48+12], %r50; | |
ld.global.u32 %r51, [%rd10+16]; | |
ld.global.u32 %r52, [%rd13]; | |
xor.b32 %r53, %r51, %r52; | |
st.global.u32 [%rd48+16], %r53; | |
BB7_9: | |
ld.local.v2.u32 {%r54, %r55}, [%rd1+280]; | |
mov.u32 %r60, %r54; | |
setp.lt.u32 %p7, %r54, %r55; | |
@%p7 bra BB7_6; | |
BB7_10: | |
cvt.u32.u64 %r57, %rd9; | |
add.s32 %r59, %r57, 1; | |
setp.lt.u32 %p8, %r59, %r4; | |
@%p8 bra BB7_3; | |
BB7_11: | |
add.s64 %rd49, %rd4, %rd8; | |
cvt.u32.u64 %r58, %rd49; | |
setp.lt.u32 %p9, %r58, 65536; | |
@%p9 bra BB7_2; | |
BB7_12: | |
ret; | |
} | |
// .globl digit_5 | |
.entry digit_5( | |
.param .u64 .ptr .global .align 4 digit_5_param_0, | |
.param .u64 .ptr .global .align 4 digit_5_param_1, | |
.param .u64 .ptr .global .align 4 digit_5_param_2 | |
) | |
{ | |
.local .align 8 .b8 __local_depot8[296]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<10>; | |
.reg .b16 %rs<14>; | |
.reg .b32 %r<64>; | |
.reg .b64 %rd<49>; | |
mov.u64 %rd48, __local_depot8; | |
cvta.local.u64 %SP, %rd48; | |
ld.param.u64 %rd16, [digit_5_param_0]; | |
ld.param.u64 %rd17, [digit_5_param_1]; | |
ld.param.u64 %rd18, [digit_5_param_2]; | |
add.u64 %rd19, %SP, 0; | |
cvta.to.local.u64 %rd1, %rd19; | |
mov.u32 %r13, %ctaid.x; | |
mov.u32 %r1, %ntid.x; | |
mov.b32 %r14, %envreg3; | |
mad.lo.s32 %r15, %r13, %r1, %r14; | |
mov.u32 %r16, %tid.x; | |
add.s32 %r61, %r15, %r16; | |
setp.gt.u32 %p1, %r61, 65535; | |
@%p1 bra BB8_12; | |
cvt.s64.s32 %rd47, %r61; | |
add.s64 %rd3, %rd16, 8; | |
mov.b32 %r17, %envreg6; | |
mul.lo.s32 %r18, %r1, %r17; | |
cvt.s64.s32 %rd4, %r18; | |
add.s64 %rd5, %rd17, 8; | |
BB8_2: | |
mov.u64 %rd6, %rd47; | |
mov.u16 %rs3, 0; | |
st.local.v4.u8 [%rd1], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd1+4], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd1+8], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd1+12], {%rs3, %rs3, %rs3, %rs3}; | |
and.b64 %rd8, %rd6, 4294967295; | |
shl.b64 %rd20, %rd8, 2; | |
add.s64 %rd21, %rd18, %rd20; | |
ld.global.u32 %r20, [%rd21]; | |
mov.u32 %r21, 64; | |
min.u32 %r4, %r20, %r21; | |
mov.u32 %r62, 0; | |
st.global.u32 [%rd21], %r62; | |
setp.eq.s32 %p2, %r4, 0; | |
@%p2 bra BB8_11; | |
BB8_3: | |
cvt.u64.u32 %rd9, %r62; | |
mul.lo.s64 %rd22, %rd8, 1792; | |
add.s64 %rd23, %rd3, %rd22; | |
mul.wide.u32 %rd24, %r62, 28; | |
add.s64 %rd10, %rd23, %rd24; | |
ld.global.u32 %r22, [%rd10]; | |
shr.u32 %r23, %r22, 28; | |
cvt.u64.u32 %rd11, %r23; | |
add.s64 %rd25, %rd1, %rd11; | |
ld.local.u8 %rs1, [%rd25]; | |
add.s16 %rs4, %rs1, 1; | |
st.local.u8 [%rd25], %rs4; | |
cvt.u32.u16 %r24, %rs1; | |
st.local.u32 [%rd1+284], %r24; | |
setp.gt.u16 %p3, %rs1, 15; | |
@%p3 bra BB8_10; | |
cvt.u64.u16 %rd26, %rs1; | |
shl.b64 %rd27, %rd11, 4; | |
add.s64 %rd29, %rd19, %rd27; | |
add.s64 %rd30, %rd29, 16; | |
st.local.u64 [%rd1+272], %rd30; | |
add.s64 %rd31, %rd1, %rd27; | |
add.s64 %rd32, %rd31, %rd26; | |
st.local.u8 [%rd32+16], %r62; | |
mov.u32 %r63, 0; | |
st.local.u32 [%rd1+280], %r63; | |
ld.local.u32 %r26, [%rd1+284]; | |
setp.eq.s32 %p4, %r26, 0; | |
@%p4 bra BB8_10; | |
shl.b32 %r28, %r62, 22; | |
or.b32 %r6, %r28, %r61; | |
add.s64 %rd12, %rd10, 4; | |
BB8_6: | |
mov.u32 %r7, %r63; | |
add.s32 %r29, %r7, 1; | |
st.local.u32 [%rd1+280], %r29; | |
ld.local.u64 %rd33, [%rd1+272]; | |
cvt.u64.u32 %rd34, %r7; | |
add.s64 %rd35, %rd33, %rd34; | |
ld.u8 %rs2, [%rd35]; | |
cvt.u32.u16 %r30, %rs2; | |
and.b32 %r31, %r30, 255; | |
mul.wide.u32 %rd38, %r31, 28; | |
add.s64 %rd39, %rd23, %rd38; | |
add.s64 %rd13, %rd39, 16; | |
ld.global.u32 %r32, [%rd10+16]; | |
ld.global.u32 %r33, [%rd39+16]; | |
setp.eq.s32 %p5, %r33, %r32; | |
@%p5 bra BB8_9; | |
ld.global.u8 %rs5, [%rd12+3]; | |
ld.global.u8 %rs6, [%rd13+-9]; | |
xor.b16 %rs7, %rs5, %rs6; | |
cvt.u32.u16 %r34, %rs7; | |
and.b32 %r35, %r34, 15; | |
ld.global.u8 %rs8, [%rd12+4]; | |
ld.global.u8 %rs9, [%rd13+-8]; | |
xor.b16 %rs10, %rs8, %rs9; | |
cvt.u32.u16 %r36, %rs10; | |
bfi.b32 %r37, %r35, %r36, 8, 24; | |
shl.b32 %r38, %r37, 4; | |
ld.global.u8 %rs11, [%rd12+5]; | |
ld.global.u8 %rs12, [%rd13+-7]; | |
xor.b16 %rs13, %rs11, %rs12; | |
cvt.u32.u16 %r39, %rs13; | |
and.b32 %r8, %r39, 255; | |
bfe.u32 %r40, %r39, 4, 4; | |
or.b32 %r41, %r40, %r38; | |
cvt.u64.u32 %rd14, %r41; | |
mul.wide.u32 %rd40, %r41, 4; | |
add.s64 %rd41, %rd18, %rd40; | |
add.s64 %rd42, %rd41, 262144; | |
atom.global.add.u32 %r9, [%rd42], 1; | |
setp.gt.u32 %p6, %r9, 63; | |
@%p6 bra BB8_9; | |
shl.b32 %r44, %r31, 16; | |
or.b32 %r45, %r6, %r44; | |
shl.b32 %r46, %r8, 28; | |
or.b32 %r47, %r45, %r46; | |
mul.lo.s64 %rd43, %rd14, 1792; | |
add.s64 %rd44, %rd5, %rd43; | |
mul.wide.u32 %rd45, %r9, 28; | |
add.s64 %rd46, %rd44, %rd45; | |
st.global.u32 [%rd46], %r47; | |
ld.global.u32 %r48, [%rd10+8]; | |
ld.global.u32 %r49, [%rd13+-8]; | |
xor.b32 %r50, %r48, %r49; | |
st.global.u32 [%rd46+4], %r50; | |
ld.global.u32 %r51, [%rd10+12]; | |
ld.global.u32 %r52, [%rd13+-4]; | |
xor.b32 %r53, %r51, %r52; | |
st.global.u32 [%rd46+8], %r53; | |
ld.global.u32 %r54, [%rd10+16]; | |
ld.global.u32 %r55, [%rd13]; | |
xor.b32 %r56, %r54, %r55; | |
st.global.u32 [%rd46+12], %r56; | |
BB8_9: | |
ld.local.v2.u32 {%r57, %r58}, [%rd1+280]; | |
mov.u32 %r63, %r57; | |
setp.lt.u32 %p7, %r57, %r58; | |
@%p7 bra BB8_6; | |
BB8_10: | |
cvt.u32.u64 %r60, %rd9; | |
add.s32 %r62, %r60, 1; | |
setp.lt.u32 %p8, %r62, %r4; | |
@%p8 bra BB8_3; | |
BB8_11: | |
add.s64 %rd47, %rd4, %rd8; | |
cvt.u32.u64 %r61, %rd47; | |
setp.lt.u32 %p9, %r61, 65536; | |
@%p9 bra BB8_2; | |
BB8_12: | |
ret; | |
} | |
// .globl digit_6 | |
.entry digit_6( | |
.param .u64 .ptr .global .align 4 digit_6_param_0, | |
.param .u64 .ptr .global .align 4 digit_6_param_1, | |
.param .u64 .ptr .global .align 4 digit_6_param_2 | |
) | |
{ | |
.local .align 8 .b8 __local_depot9[296]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<10>; | |
.reg .b16 %rs<15>; | |
.reg .b32 %r<55>; | |
.reg .b64 %rd<51>; | |
mov.u64 %rd50, __local_depot9; | |
cvta.local.u64 %SP, %rd50; | |
ld.param.u64 %rd16, [digit_6_param_0]; | |
ld.param.u64 %rd17, [digit_6_param_1]; | |
ld.param.u64 %rd18, [digit_6_param_2]; | |
add.u64 %rd19, %SP, 0; | |
cvta.to.local.u64 %rd1, %rd19; | |
mov.u32 %r13, %ctaid.x; | |
mov.u32 %r1, %ntid.x; | |
mov.b32 %r14, %envreg3; | |
mad.lo.s32 %r15, %r13, %r1, %r14; | |
mov.u32 %r16, %tid.x; | |
add.s32 %r52, %r15, %r16; | |
setp.gt.u32 %p1, %r52, 65535; | |
@%p1 bra BB9_12; | |
cvt.s64.s32 %rd49, %r52; | |
add.s64 %rd3, %rd17, 8; | |
mov.b32 %r17, %envreg6; | |
mul.lo.s32 %r18, %r1, %r17; | |
cvt.s64.s32 %rd4, %r18; | |
add.s64 %rd5, %rd16, 12; | |
BB9_2: | |
mov.u64 %rd6, %rd49; | |
mov.u16 %rs4, 0; | |
st.local.v4.u8 [%rd1], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd1+4], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd1+8], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd1+12], {%rs4, %rs4, %rs4, %rs4}; | |
and.b64 %rd8, %rd6, 4294967295; | |
shl.b64 %rd20, %rd8, 2; | |
add.s64 %rd21, %rd18, %rd20; | |
ld.global.u32 %r20, [%rd21+262144]; | |
mov.u32 %r21, 64; | |
min.u32 %r4, %r20, %r21; | |
mov.u32 %r53, 0; | |
st.global.u32 [%rd21+262144], %r53; | |
setp.eq.s32 %p2, %r4, 0; | |
@%p2 bra BB9_11; | |
BB9_3: | |
cvt.u64.u32 %rd9, %r53; | |
mul.lo.s64 %rd22, %rd8, 1792; | |
add.s64 %rd23, %rd3, %rd22; | |
mul.wide.u32 %rd24, %r53, 28; | |
add.s64 %rd10, %rd23, %rd24; | |
ld.global.u32 %r22, [%rd10]; | |
shr.u32 %r23, %r22, 28; | |
cvt.u64.u32 %rd11, %r23; | |
add.s64 %rd25, %rd1, %rd11; | |
ld.local.u8 %rs1, [%rd25]; | |
add.s16 %rs5, %rs1, 1; | |
st.local.u8 [%rd25], %rs5; | |
cvt.u32.u16 %r24, %rs1; | |
st.local.u32 [%rd1+284], %r24; | |
setp.gt.u16 %p3, %rs1, 15; | |
@%p3 bra BB9_10; | |
cvt.u64.u16 %rd26, %rs1; | |
shl.b64 %rd27, %rd11, 4; | |
add.s64 %rd29, %rd19, %rd27; | |
add.s64 %rd30, %rd29, 16; | |
st.local.u64 [%rd1+272], %rd30; | |
add.s64 %rd31, %rd1, %rd27; | |
add.s64 %rd32, %rd31, %rd26; | |
st.local.u8 [%rd32+16], %r53; | |
mov.u32 %r54, 0; | |
st.local.u32 [%rd1+280], %r54; | |
ld.local.u32 %r26, [%rd1+284]; | |
setp.eq.s32 %p4, %r26, 0; | |
@%p4 bra BB9_10; | |
shl.b32 %r28, %r53, 22; | |
or.b32 %r6, %r28, %r52; | |
add.s64 %rd12, %rd10, 4; | |
BB9_6: | |
mov.u32 %r7, %r54; | |
add.s32 %r29, %r7, 1; | |
st.local.u32 [%rd1+280], %r29; | |
ld.local.u64 %rd33, [%rd1+272]; | |
cvt.u64.u32 %rd34, %r7; | |
add.s64 %rd35, %rd33, %rd34; | |
ld.u8 %rs2, [%rd35]; | |
cvt.u32.u16 %r30, %rs2; | |
and.b32 %r31, %r30, 255; | |
mul.wide.u32 %rd38, %r31, 28; | |
add.s64 %rd39, %rd23, %rd38; | |
add.s64 %rd13, %rd39, 12; | |
ld.global.u32 %r32, [%rd10+12]; | |
ld.global.u32 %r33, [%rd39+12]; | |
setp.eq.s32 %p5, %r33, %r32; | |
@%p5 bra BB9_9; | |
ld.global.u8 %rs6, [%rd12+2]; | |
ld.global.u8 %rs7, [%rd13+-6]; | |
xor.b16 %rs8, %rs6, %rs7; | |
cvt.u32.u16 %r35, %rs8; | |
and.b32 %r36, %r35, 255; | |
mul.wide.u32 %rd40, %r36, 256; | |
ld.global.u8 %rs9, [%rd12+3]; | |
ld.global.u8 %rs10, [%rd13+-5]; | |
xor.b16 %rs11, %rs9, %rs10; | |
cvt.u64.u16 %rd41, %rs11; | |
and.b64 %rd42, %rd41, 255; | |
or.b64 %rd14, %rd42, %rd40; | |
ld.global.u8 %rs12, [%rd12+4]; | |
ld.global.u8 %rs13, [%rd13+-4]; | |
xor.b16 %rs3, %rs12, %rs13; | |
shl.b64 %rd43, %rd14, 2; | |
add.s64 %rd44, %rd18, %rd43; | |
atom.global.add.u32 %r9, [%rd44], 1; | |
setp.gt.u32 %p6, %r9, 63; | |
@%p6 bra BB9_9; | |
shr.u16 %rs14, %rs3, 4; | |
cvt.u32.u16 %r37, %rs14; | |
shl.b32 %r38, %r37, 28; | |
shl.b32 %r39, %r31, 16; | |
or.b32 %r40, %r6, %r39; | |
or.b32 %r41, %r40, %r38; | |
mul.lo.s64 %rd45, %rd14, 1792; | |
add.s64 %rd46, %rd5, %rd45; | |
mul.wide.u32 %rd47, %r9, 28; | |
add.s64 %rd48, %rd46, %rd47; | |
st.global.u32 [%rd48], %r41; | |
ld.global.u32 %r42, [%rd10+8]; | |
ld.global.u32 %r43, [%rd13+-4]; | |
xor.b32 %r44, %r42, %r43; | |
st.global.u32 [%rd48+4], %r44; | |
ld.global.u32 %r45, [%rd10+12]; | |
ld.global.u32 %r46, [%rd13]; | |
xor.b32 %r47, %r45, %r46; | |
st.global.u32 [%rd48+8], %r47; | |
BB9_9: | |
ld.local.v2.u32 {%r48, %r49}, [%rd1+280]; | |
mov.u32 %r54, %r48; | |
setp.lt.u32 %p7, %r48, %r49; | |
@%p7 bra BB9_6; | |
BB9_10: | |
cvt.u32.u64 %r51, %rd9; | |
add.s32 %r53, %r51, 1; | |
setp.lt.u32 %p8, %r53, %r4; | |
@%p8 bra BB9_3; | |
BB9_11: | |
add.s64 %rd49, %rd4, %rd8; | |
cvt.u32.u64 %r52, %rd49; | |
setp.lt.u32 %p9, %r52, 65536; | |
@%p9 bra BB9_2; | |
BB9_12: | |
ret; | |
} | |
// .globl digit_7 | |
.entry digit_7( | |
.param .u64 .ptr .global .align 4 digit_7_param_0, | |
.param .u64 .ptr .global .align 4 digit_7_param_1, | |
.param .u64 .ptr .global .align 4 digit_7_param_2 | |
) | |
{ | |
.local .align 8 .b8 __local_depot10[296]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<10>; | |
.reg .b16 %rs<14>; | |
.reg .b32 %r<61>; | |
.reg .b64 %rd<53>; | |
mov.u64 %rd52, __local_depot10; | |
cvta.local.u64 %SP, %rd52; | |
ld.param.u64 %rd11, [digit_7_param_0]; | |
ld.param.u64 %rd12, [digit_7_param_1]; | |
ld.param.u64 %rd13, [digit_7_param_2]; | |
mov.u32 %r13, %ctaid.x; | |
mov.u32 %r1, %ntid.x; | |
mov.b32 %r14, %envreg3; | |
mad.lo.s32 %r15, %r13, %r1, %r14; | |
mov.u32 %r16, %tid.x; | |
add.s32 %r58, %r15, %r16; | |
setp.gt.u32 %p1, %r58, 65535; | |
@%p1 bra BB10_12; | |
cvt.s64.s32 %rd51, %r58; | |
mov.b32 %r17, %envreg6; | |
mul.lo.s32 %r18, %r1, %r17; | |
cvt.s64.s32 %rd2, %r18; | |
BB10_2: | |
mov.u64 %rd3, %rd51; | |
add.u64 %rd14, %SP, 0; | |
cvta.to.local.u64 %rd15, %rd14; | |
mov.u16 %rs3, 0; | |
st.local.v4.u8 [%rd15], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd15+4], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd15+8], {%rs3, %rs3, %rs3, %rs3}; | |
st.local.v4.u8 [%rd15+12], {%rs3, %rs3, %rs3, %rs3}; | |
and.b64 %rd4, %rd3, 4294967295; | |
shl.b64 %rd16, %rd4, 2; | |
add.s64 %rd17, %rd13, %rd16; | |
ld.global.u32 %r20, [%rd17]; | |
mov.u32 %r21, 64; | |
min.u32 %r4, %r20, %r21; | |
mov.u32 %r59, 0; | |
st.global.u32 [%rd17], %r59; | |
setp.eq.s32 %p2, %r4, 0; | |
@%p2 bra BB10_11; | |
BB10_3: | |
mul.lo.s64 %rd20, %rd4, 1792; | |
add.s64 %rd21, %rd11, %rd20; | |
cvt.u64.u32 %rd5, %r59; | |
mul.wide.u32 %rd22, %r59, 28; | |
add.s64 %rd23, %rd21, %rd22; | |
add.s64 %rd6, %rd23, 12; | |
ld.global.u32 %r22, [%rd23+12]; | |
shr.u32 %r23, %r22, 28; | |
cvt.u64.u32 %rd7, %r23; | |
add.s64 %rd24, %rd15, %rd7; | |
ld.local.u8 %rs1, [%rd24]; | |
add.s16 %rs4, %rs1, 1; | |
st.local.u8 [%rd24], %rs4; | |
cvt.u32.u16 %r24, %rs1; | |
st.local.u32 [%rd15+284], %r24; | |
setp.gt.u16 %p3, %rs1, 15; | |
@%p3 bra BB10_10; | |
cvt.u64.u16 %rd25, %rs1; | |
shl.b64 %rd26, %rd7, 4; | |
add.s64 %rd28, %rd14, %rd26; | |
add.s64 %rd29, %rd28, 16; | |
st.local.u64 [%rd15+272], %rd29; | |
add.s64 %rd31, %rd15, %rd26; | |
add.s64 %rd32, %rd31, %rd25; | |
st.local.u8 [%rd32+16], %r59; | |
mov.u32 %r60, 0; | |
st.local.u32 [%rd15+280], %r60; | |
ld.local.u32 %r26, [%rd15+284]; | |
setp.eq.s32 %p4, %r26, 0; | |
@%p4 bra BB10_10; | |
shl.b32 %r28, %r59, 22; | |
or.b32 %r6, %r28, %r58; | |
BB10_6: | |
mov.u32 %r7, %r60; | |
add.s32 %r29, %r7, 1; | |
st.local.u32 [%rd15+280], %r29; | |
ld.local.u64 %rd37, [%rd15+272]; | |
cvt.u64.u32 %rd38, %r7; | |
add.s64 %rd39, %rd37, %rd38; | |
ld.u8 %rs2, [%rd39]; | |
cvt.u32.u16 %r30, %rs2; | |
and.b32 %r31, %r30, 255; | |
mul.wide.u32 %rd40, %r31, 28; | |
add.s64 %rd41, %rd21, %rd40; | |
add.s64 %rd8, %rd41, 20; | |
ld.global.u32 %r32, [%rd6+8]; | |
ld.global.u32 %r33, [%rd41+20]; | |
setp.eq.s32 %p5, %r33, %r32; | |
@%p5 bra BB10_9; | |
ld.global.u8 %rs5, [%rd6+4]; | |
ld.global.u8 %rs6, [%rd8+-4]; | |
xor.b16 %rs7, %rs5, %rs6; | |
cvt.u32.u16 %r34, %rs7; | |
and.b32 %r35, %r34, 15; | |
ld.global.u8 %rs8, [%rd6+5]; | |
ld.global.u8 %rs9, [%rd8+-3]; | |
xor.b16 %rs10, %rs8, %rs9; | |
cvt.u32.u16 %r36, %rs10; | |
bfi.b32 %r37, %r35, %r36, 8, 24; | |
shl.b32 %r38, %r37, 4; | |
ld.global.u8 %rs11, [%rd6+6]; | |
ld.global.u8 %rs12, [%rd8+-2]; | |
xor.b16 %rs13, %rs11, %rs12; | |
cvt.u32.u16 %r39, %rs13; | |
and.b32 %r8, %r39, 255; | |
bfe.u32 %r40, %r39, 4, 4; | |
or.b32 %r41, %r40, %r38; | |
cvt.u64.u32 %rd9, %r41; | |
mul.wide.u32 %rd42, %r41, 4; | |
add.s64 %rd43, %rd13, %rd42; | |
add.s64 %rd44, %rd43, 262144; | |
atom.global.add.u32 %r9, [%rd44], 1; | |
setp.gt.u32 %p6, %r9, 63; | |
@%p6 bra BB10_9; | |
mul.lo.s64 %rd45, %rd9, 1792; | |
add.s64 %rd46, %rd12, %rd45; | |
shl.b32 %r44, %r31, 16; | |
or.b32 %r45, %r6, %r44; | |
shl.b32 %r46, %r8, 28; | |
or.b32 %r47, %r45, %r46; | |
mul.wide.u32 %rd47, %r9, 28; | |
add.s64 %rd48, %rd46, %rd47; | |
st.global.u32 [%rd48+12], %r47; | |
ld.global.u32 %r48, [%rd6+4]; | |
ld.global.u32 %r49, [%rd8+-4]; | |
xor.b32 %r50, %r48, %r49; | |
st.global.u32 [%rd48+16], %r50; | |
ld.global.u32 %r51, [%rd6+8]; | |
ld.global.u32 %r52, [%rd8]; | |
xor.b32 %r53, %r51, %r52; | |
st.global.u32 [%rd48+20], %r53; | |
BB10_9: | |
ld.local.v2.u32 {%r54, %r55}, [%rd15+280]; | |
mov.u32 %r60, %r54; | |
setp.lt.u32 %p7, %r54, %r55; | |
@%p7 bra BB10_6; | |
BB10_10: | |
cvt.u32.u64 %r57, %rd5; | |
add.s32 %r59, %r57, 1; | |
setp.lt.u32 %p8, %r59, %r4; | |
@%p8 bra BB10_3; | |
BB10_11: | |
add.s64 %rd51, %rd2, %rd4; | |
cvt.u32.u64 %r58, %rd51; | |
setp.lt.u32 %p9, %r58, 65536; | |
@%p9 bra BB10_2; | |
BB10_12: | |
ret; | |
} | |
// .globl digit_8 | |
.entry digit_8( | |
.param .u64 .ptr .global .align 4 digit_8_param_0, | |
.param .u64 .ptr .global .align 4 digit_8_param_1, | |
.param .u64 .ptr .global .align 4 digit_8_param_2 | |
) | |
{ | |
.local .align 8 .b8 __local_depot11[296]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<10>; | |
.reg .b16 %rs<12>; | |
.reg .b32 %r<53>; | |
.reg .b64 %rd<56>; | |
mov.u64 %rd55, __local_depot11; | |
cvta.local.u64 %SP, %rd55; | |
ld.param.u64 %rd12, [digit_8_param_0]; | |
ld.param.u64 %rd13, [digit_8_param_1]; | |
ld.param.u64 %rd14, [digit_8_param_2]; | |
mov.u32 %r15, %ctaid.x; | |
mov.u32 %r1, %ntid.x; | |
mov.b32 %r16, %envreg3; | |
mad.lo.s32 %r17, %r15, %r1, %r16; | |
mov.u32 %r18, %tid.x; | |
add.s32 %r50, %r17, %r18; | |
setp.gt.u32 %p1, %r50, 65535; | |
@%p1 bra BB11_12; | |
cvt.s64.s32 %rd54, %r50; | |
mov.b32 %r19, %envreg6; | |
mul.lo.s32 %r20, %r1, %r19; | |
cvt.s64.s32 %rd2, %r20; | |
BB11_2: | |
mov.u64 %rd3, %rd54; | |
add.u64 %rd15, %SP, 0; | |
cvta.to.local.u64 %rd16, %rd15; | |
mov.u16 %rs4, 0; | |
st.local.v4.u8 [%rd16], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd16+4], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd16+8], {%rs4, %rs4, %rs4, %rs4}; | |
st.local.v4.u8 [%rd16+12], {%rs4, %rs4, %rs4, %rs4}; | |
and.b64 %rd4, %rd3, 4294967295; | |
shl.b64 %rd17, %rd4, 2; | |
add.s64 %rd18, %rd14, %rd17; | |
ld.global.u32 %r22, [%rd18+262144]; | |
mov.u32 %r23, 64; | |
min.u32 %r4, %r22, %r23; | |
mov.u32 %r51, 0; | |
st.global.u32 [%rd18+262144], %r51; | |
setp.eq.s32 %p2, %r4, 0; | |
@%p2 bra BB11_11; | |
BB11_3: | |
mul.lo.s64 %rd21, %rd4, 1792; | |
add.s64 %rd22, %rd13, %rd21; | |
cvt.u64.u32 %rd5, %r51; | |
mul.wide.u32 %rd23, %r51, 28; | |
add.s64 %rd24, %rd22, %rd23; | |
add.s64 %rd6, %rd24, 12; | |
ld.global.u32 %r24, [%rd24+12]; | |
shr.u32 %r25, %r24, 28; | |
cvt.u64.u32 %rd7, %r25; | |
add.s64 %rd25, %rd16, %rd7; | |
ld.local.u8 %rs1, [%rd25]; | |
add.s16 %rs5, %rs1, 1; | |
st.local.u8 [%rd25], %rs5; | |
cvt.u32.u16 %r26, %rs1; | |
st.local.u32 [%rd16+284], %r26; | |
setp.gt.u16 %p3, %rs1, 15; | |
@%p3 bra BB11_10; | |
cvt.u64.u16 %rd26, %rs1; | |
shl.b64 %rd27, %rd7, 4; | |
add.s64 %rd29, %rd15, %rd27; | |
add.s64 %rd30, %rd29, 16; | |
st.local.u64 [%rd16+272], %rd30; | |
add.s64 %rd32, %rd16, %rd27; | |
add.s64 %rd33, %rd32, %rd26; | |
st.local.u8 [%rd33+16], %r51; | |
mov.u32 %r52, 0; | |
st.local.u32 [%rd16+280], %r52; | |
ld.local.u32 %r28, [%rd16+284]; | |
setp.eq.s32 %p4, %r28, 0; | |
@%p4 bra BB11_10; | |
shl.b32 %r30, %r51, 22; | |
or.b32 %r6, %r30, %r50; | |
add.s64 %rd8, %rd6, 4; | |
BB11_6: | |
mov.u32 %r7, %r52; | |
add.s32 %r31, %r7, 1; | |
st.local.u32 [%rd16+280], %r31; | |
ld.local.u64 %rd38, [%rd16+272]; | |
cvt.u64.u32 %rd39, %r7; | |
add.s64 %rd40, %rd38, %rd39; | |
ld.u8 %rs2, [%rd40]; | |
cvt.u32.u16 %r32, %rs2; | |
and.b32 %r33, %r32, 255; | |
mul.wide.u32 %rd41, %r33, 28; | |
add.s64 %rd42, %rd22, %rd41; | |
add.s64 %rd9, %rd42, 20; | |
ld.global.u32 %r8, [%rd6+8]; | |
ld.global.u32 %r9, [%rd42+20]; | |
setp.eq.s32 %p5, %r9, %r8; | |
@%p5 bra BB11_9; | |
ld.global.u8 %rs6, [%rd8+3]; | |
ld.global.u8 %rs7, [%rd9+-1]; | |
xor.b16 %rs8, %rs6, %rs7; | |
cvt.u32.u16 %r35, %rs8; | |
and.b32 %r36, %r35, 255; | |
mul.wide.u32 %rd43, %r36, 256; | |
xor.b32 %r37, %r8, %r9; | |
cvt.u64.u32 %rd44, %r37; | |
and.b64 %rd45, %rd44, 255; | |
or.b64 %rd10, %rd45, %rd43; | |
ld.global.u8 %rs9, [%rd8+5]; | |
ld.global.u8 %rs10, [%rd9+1]; | |
xor.b16 %rs3, %rs9, %rs10; | |
shl.b64 %rd46, %rd10, 2; | |
add.s64 %rd47, %rd14, %rd46; | |
atom.global.add.u32 %r11, [%rd47], 1; | |
setp.gt.u32 %p6, %r11, 63; | |
@%p6 bra BB11_9; | |
mul.lo.s64 %rd48, %rd10, 1792; | |
add.s64 %rd49, %rd12, %rd48; | |
shr.u16 %rs11, %rs3, 4; | |
cvt.u32.u16 %r38, %rs11; | |
shl.b32 %r39, %r38, 28; | |
shl.b32 %r40, %r33, 16; | |
or.b32 %r41, %r6, %r40; | |
or.b32 %r42, %r41, %r39; | |
mul.wide.u32 %rd50, %r11, 28; | |
add.s64 %rd51, %rd49, %rd50; | |
st.global.u32 [%rd51+16], %r42; | |
ld.global.u32 %r43, [%rd6+8]; | |
ld.global.u32 %r44, [%rd9]; | |
xor.b32 %r45, %r43, %r44; | |
st.global.u32 [%rd51+20], %r45; | |
BB11_9: | |
ld.local.v2.u32 {%r46, %r47}, [%rd16+280]; | |
mov.u32 %r52, %r46; | |
setp.lt.u32 %p7, %r46, %r47; | |
@%p7 bra BB11_6; | |
BB11_10: | |
cvt.u32.u64 %r49, %rd5; | |
add.s32 %r51, %r49, 1; | |
setp.lt.u32 %p8, %r51, %r4; | |
@%p8 bra BB11_3; | |
BB11_11: | |
add.s64 %rd54, %rd2, %rd4; | |
cvt.u32.u64 %r50, %rd54; | |
setp.lt.u32 %p9, %r50, 65536; | |
@%p9 bra BB11_2; | |
BB11_12: | |
ret; | |
} | |
// .globl digitK | |
.entry digitK( | |
.param .u64 .ptr .global .align 4 digitK_param_0, | |
.param .u64 .ptr .global .align 4 digitK_param_1, | |
.param .u64 .ptr .global .align 4 digitK_param_2, | |
.param .u64 .ptr .global .align 4 digitK_param_3, | |
.param .u64 .ptr .global .align 4 digitK_param_4 | |
) | |
{ | |
.local .align 16 .b8 __local_depot12[3376]; | |
.reg .b64 %SP; | |
.reg .b64 %SPL; | |
.reg .pred %p<802>; | |
.reg .b16 %rs<22>; | |
.reg .b32 %r<22617>; | |
.reg .b64 %rd<5901>; | |
mov.u64 %rd5900, __local_depot12; | |
cvta.local.u64 %SP, %rd5900; | |
ld.param.u64 %rd414, [digitK_param_0]; | |
ld.param.u64 %rd415, [digitK_param_1]; | |
ld.param.u64 %rd417, [digitK_param_3]; | |
add.u64 %rd419, %SP, 0; | |
cvta.to.local.u64 %rd1, %rd419; | |
add.u64 %rd420, %SP, 1024; | |
cvta.to.local.u64 %rd2, %rd420; | |
mov.u32 %r5213, %ctaid.x; | |
mov.u32 %r1, %ntid.x; | |
mov.b32 %r5214, %envreg3; | |
mad.lo.s32 %r5215, %r5213, %r1, %r5214; | |
mov.u32 %r5216, %tid.x; | |
add.s32 %r11394, %r5215, %r5216; | |
setp.gt.u32 %p1, %r11394, 65535; | |
@%p1 bra BB12_1569; | |
cvt.s64.s32 %rd5899, %r11394; | |
add.s64 %rd4, %rd414, 16; | |
mov.b32 %r5217, %envreg6; | |
mul.lo.s32 %r5218, %r1, %r5217; | |
cvt.s64.s32 %rd5, %r5218; | |
add.s64 %rd6, %rd415, 12; | |
BB12_2: | |
ld.param.u64 %rd5892, [digitK_param_2]; | |
add.u64 %rd421, %SP, 3072; | |
cvta.to.local.u64 %rd422, %rd421; | |
mov.u16 %rs11, 0; | |
st.local.v4.u8 [%rd422], {%rs11, %rs11, %rs11, %rs11}; | |
st.local.v4.u8 [%rd422+4], {%rs11, %rs11, %rs11, %rs11}; | |
st.local.v4.u8 [%rd422+8], {%rs11, %rs11, %rs11, %rs11}; | |
st.local.v4.u8 [%rd422+12], {%rs11, %rs11, %rs11, %rs11}; | |
and.b64 %rd8, %rd5899, 4294967295; | |
shl.b64 %rd423, %rd8, 2; | |
add.s64 %rd424, %rd5892, %rd423; | |
ld.global.u32 %r5219, [%rd424]; | |
mov.u32 %r5220, 64; | |
min.u32 %r4, %r5219, %r5220; | |
mov.u32 %r11395, 0; | |
st.global.u32 [%rd424], %r11395; | |
setp.eq.s32 %p2, %r4, 0; | |
@%p2 bra BB12_1568; | |
BB12_3: | |
and.b64 %rd5893, %rd5899, 4294967295; | |
cvt.u64.u32 %rd10, %r11395; | |
mul.lo.s64 %rd425, %rd5893, 1792; | |
add.s64 %rd426, %rd4, %rd425; | |
mul.wide.u32 %rd427, %r11395, 28; | |
add.s64 %rd11, %rd426, %rd427; | |
ld.global.u32 %r5223, [%rd11]; | |
shr.u32 %r5224, %r5223, 28; | |
cvt.u64.u32 %rd12, %r5224; | |
add.s64 %rd430, %rd422, %rd12; | |
ld.local.u8 %rs1, [%rd430]; | |
add.s16 %rs12, %rs1, 1; | |
st.local.u8 [%rd430], %rs12; | |
cvt.u32.u16 %r5225, %rs1; | |
st.local.u32 [%rd422+284], %r5225; | |
setp.gt.u16 %p3, %rs1, 15; | |
@%p3 bra BB12_5; | |
add.u64 %rd5894, %SP, 3072; | |
cvt.u64.u16 %rd431, %rs1; | |
shl.b64 %rd432, %rd12, 4; | |
add.s64 %rd434, %rd5894, %rd432; | |
add.s64 %rd435, %rd434, 16; | |
st.local.u64 [%rd422+272], %rd435; | |
add.s64 %rd437, %rd422, %rd432; | |
add.s64 %rd438, %rd437, %rd431; | |
st.local.u8 [%rd438+16], %r11395; | |
mov.u32 %r5226, 0; | |
st.local.u32 [%rd422+280], %r5226; | |
BB12_5: | |
@%p3 bra BB12_1567; | |
ld.local.v2.u32 {%r5227, %r5228}, [%rd422+280]; | |
mov.u32 %r11396, %r5227; | |
setp.ge.u32 %p5, %r5227, %r5228; | |
@%p5 bra BB12_1567; | |
BB12_7: | |
mov.u32 %r8, %r11396; | |
and.b64 %rd5897, %rd5899, 4294967295; | |
mul.lo.s64 %rd5896, %rd5893, 1792; | |
add.s64 %rd5895, %rd4, %rd5896; | |
add.s32 %r5230, %r8, 1; | |
st.local.u32 [%rd422+280], %r5230; | |
ld.local.u64 %rd443, [%rd422+272]; | |
cvt.u64.u32 %rd444, %r8; | |
add.s64 %rd445, %rd443, %rd444; | |
ld.u8 %rs2, [%rd445]; | |
cvt.u32.u16 %r5231, %rs2; | |
and.b32 %r5232, %r5231, 255; | |
mul.wide.u32 %rd448, %r5232, 28; | |
add.s64 %rd449, %rd5895, %rd448; | |
ld.global.u32 %r5233, [%rd11+4]; | |
ld.global.u32 %r5234, [%rd449+4]; | |
setp.ne.s32 %p6, %r5234, %r5233; | |
@%p6 bra BB12_1566; | |
and.b64 %rd5898, %rd5899, 65535; | |
shr.u32 %r5237, %r11394, 16; | |
or.b32 %r5238, %r5237, %r5232; | |
and.b32 %r5239, %r5238, 63; | |
mul.lo.s64 %rd450, %rd5898, 1792; | |
add.s64 %rd451, %rd4, %rd450; | |
mul.wide.u32 %rd452, %r5239, 28; | |
add.s64 %rd13, %rd451, %rd452; | |
ld.global.u32 %r10, [%rd13]; | |
and.b32 %r5240, %r10, 65535; | |
bfe.u32 %r5241, %r10, 16, 6; | |
mul.wide.u32 %rd453, %r5240, 1792; | |
add.s64 %rd454, %rd6, %rd453; | |
mul.wide.u32 %rd455, %r5241, 28; | |
add.s64 %rd456, %rd454, %rd455; | |
ld.global.u32 %r11, [%rd456]; | |
and.b32 %r5242, %r11, 65535; | |
mul.wide.u32 %rd457, %r5242, 1792; | |
add.s64 %rd458, %rd4, %rd457; | |
bfe.u32 %r5243, %r11, 16, 6; | |
mul.wide.u32 %rd459, %r5243, 28; | |
add.s64 %rd460, %rd458, %rd459; | |
ld.global.u32 %r12, [%rd460+-4]; | |
and.b32 %r5244, %r12, 65535; | |
mul.wide.u32 %rd461, %r5244, 1792; | |
add.s64 %rd462, %rd6, %rd461; | |
bfe.u32 %r5245, %r12, 16, 6; | |
mul.wide.u32 %rd463, %r5245, 28; | |
add.s64 %rd464, %rd462, %rd463; | |
ld.global.u32 %r13, [%rd464+-4]; | |
and.b32 %r5246, %r13, 65535; | |
mul.wide.u32 %rd465, %r5246, 1792; | |
add.s64 %rd466, %rd4, %rd465; | |
bfe.u32 %r5247, %r13, 16, 6; | |
mul.wide.u32 %rd467, %r5247, 28; | |
add.s64 %rd468, %rd466, %rd467; | |
ld.global.u32 %r14, [%rd468+-8]; | |
and.b32 %r5248, %r14, 65535; | |
mul.wide.u32 %rd469, %r5248, 1792; | |
add.s64 %rd470, %rd6, %rd469; | |
bfe.u32 %r5249, %r14, 16, 6; | |
mul.wide.u32 %rd471, %r5249, 28; | |
add.s64 %rd472, %rd470, %rd471; | |
ld.global.u32 %r15, [%rd472+-8]; | |
and.b32 %r5250, %r15, 65535; | |
mul.wide.u32 %rd473, %r5250, 1792; | |
add.s64 %rd474, %rd4, %rd473; | |
shl.b32 %r5251, %r5232, 16; | |
or.b32 %r9, %r5251, %r11394; | |
cvt.u64.u32 %rd14, %r5240; | |
cvt.u64.u32 %rd15, %r5242; | |
cvt.u64.u32 %rd16, %r5244; | |
cvt.u64.u32 %rd17, %r5246; | |
cvt.u64.u32 %rd18, %r5248; | |
cvt.u64.u32 %rd19, %r5250; | |
bfe.u32 %r5252, %r15, 16, 6; | |
mul.wide.u32 %rd475, %r5252, 28; | |
add.s64 %rd476, %rd474, %rd475; | |
ld.global.u32 %r16, [%rd476+-12]; | |
and.b32 %r5253, %r16, 65535; | |
cvt.u64.u32 %rd20, %r5253; | |
bfe.u32 %r5254, %r16, 16, 6; | |
mul.wide.u32 %rd477, %r5253, 1792; | |
add.s64 %rd478, %rd415, %rd477; | |
mul.wide.u32 %rd479, %r5254, 28; | |
add.s64 %rd480, %rd478, %rd479; | |
ld.global.u32 %r5255, [%rd480]; | |
and.b32 %r5256, %r5255, 65535; | |
bfe.u32 %r5257, %r5255, 16, 6; | |
mul.wide.u32 %rd481, %r5256, 1792; | |
add.s64 %rd482, %rd414, %rd481; | |
mul.wide.u32 %rd483, %r5257, 28; | |
add.s64 %rd484, %rd482, %rd483; | |
ld.global.u32 %r5258, [%rd484]; | |
and.b32 %r5259, %r5258, 65535; | |
shl.b32 %r5260, %r5259, 6; | |
bfe.u32 %r5261, %r5258, 16, 6; | |
or.b32 %r17, %r5260, %r5261; | |
st.local.u32 [%rd2], %r17; | |
bfe.u32 %r5262, %r5255, 22, 6; | |
mul.wide.u32 %rd485, %r5262, 28; | |
add.s64 %rd486, %rd482, %rd485; | |
ld.global.u32 %r5263, [%rd486]; | |
and.b32 %r5264, %r5263, 65535; | |
shl.b32 %r5265, %r5264, 6; | |
bfe.u32 %r5266, %r5263, 16, 6; | |
or.b32 %r13314, %r5265, %r5266; | |
st.local.u32 [%rd2+4], %r13314; | |
setp.le.u32 %p7, %r17, %r13314; | |
mov.u32 %r13313, %r17; | |
@%p7 bra BB12_10; | |
st.local.v2.u32 [%rd2], {%r13314, %r17}; | |
mov.u32 %r11397, %r13314; | |
mov.u32 %r13314, %r17; | |
mov.u32 %r13313, %r11397; | |
BB12_10: | |
mov.u32 %r13309, %r13313; | |
mov.u32 %r13310, %r13314; | |
bfe.u32 %r5267, %r16, 22, 6; | |
mul.lo.s64 %rd487, %rd20, 1792; | |
add.s64 %rd488, %rd415, %rd487; | |
mul.wide.u32 %rd489, %r5267, 28; | |
add.s64 %rd490, %rd488, %rd489; | |
ld.global.u32 %r5268, [%rd490]; | |
and.b32 %r5269, %r5268, 65535; | |
bfe.u32 %r5270, %r5268, 16, 6; | |
mul.wide.u32 %rd491, %r5269, 1792; | |
add.s64 %rd492, %rd414, %rd491; | |
mul.wide.u32 %rd493, %r5270, 28; | |
add.s64 %rd494, %rd492, %rd493; | |
ld.global.u32 %r5271, [%rd494]; | |
and.b32 %r5272, %r5271, 65535; | |
shl.b32 %r5273, %r5272, 6; | |
bfe.u32 %r5274, %r5271, 16, 6; | |
or.b32 %r21, %r5273, %r5274; | |
st.local.u32 [%rd2+8], %r21; | |
bfe.u32 %r5275, %r5268, 22, 6; | |
mul.wide.u32 %rd495, %r5275, 28; | |
add.s64 %rd496, %rd492, %rd495; | |
ld.global.u32 %r5276, [%rd496]; | |
and.b32 %r5277, %r5276, 65535; | |
shl.b32 %r5278, %r5277, 6; | |
bfe.u32 %r5279, %r5276, 16, 6; | |
or.b32 %r13316, %r5278, %r5279; | |
st.local.u32 [%rd2+12], %r13316; | |
setp.le.u32 %p8, %r21, %r13316; | |
mov.u32 %r13315, %r21; | |
@%p8 bra BB12_12; | |
st.local.v2.u32 [%rd2+8], {%r13316, %r21}; | |
mov.u32 %r11403, %r13316; | |
mov.u32 %r13316, %r21; | |
mov.u32 %r13315, %r11403; | |
BB12_12: | |
mov.u32 %r24, %r13315; | |
mov.u32 %r23, %r13316; | |
setp.le.u32 %p9, %r13309, %r24; | |
mov.u32 %r13311, %r24; | |
mov.u32 %r13312, %r23; | |
@%p9 bra BB12_14; | |
st.local.v4.u32 [%rd2], {%r24, %r23, %r13309, %r13310}; | |
mov.u32 %r11400, %r13310; | |
mov.u32 %r11402, %r13309; | |
mov.u32 %r13310, %r23; | |
mov.u32 %r13309, %r24; | |
mov.u32 %r13311, %r11402; | |
mov.u32 %r13312, %r11400; | |
BB12_14: | |
mov.u32 %r13301, %r13309; | |
mov.u32 %r13302, %r13310; | |
mov.u32 %r13303, %r13311; | |
mov.u32 %r13304, %r13312; | |
mul.lo.s64 %rd497, %rd19, 1792; | |
add.s64 %rd498, %rd4, %rd497; | |
bfe.u32 %r5280, %r15, 22, 6; | |
mul.wide.u32 %rd499, %r5280, 28; | |
add.s64 %rd500, %rd498, %rd499; | |
ld.global.u32 %r29, [%rd500+-12]; | |
and.b32 %r5281, %r29, 65535; | |
cvt.u64.u32 %rd22, %r5281; | |
bfe.u32 %r5282, %r29, 16, 6; | |
mul.wide.u32 %rd501, %r5281, 1792; | |
add.s64 %rd502, %rd415, %rd501; | |
mul.wide.u32 %rd503, %r5282, 28; | |
add.s64 %rd504, %rd502, %rd503; | |
ld.global.u32 %r5283, [%rd504]; | |
and.b32 %r5284, %r5283, 65535; | |
bfe.u32 %r5285, %r5283, 16, 6; | |
mul.wide.u32 %rd505, %r5284, 1792; | |
add.s64 %rd506, %rd414, %rd505; | |
mul.wide.u32 %rd507, %r5285, 28; | |
add.s64 %rd508, %rd506, %rd507; | |
ld.global.u32 %r5286, [%rd508]; | |
and.b32 %r5287, %r5286, 65535; | |
shl.b32 %r5288, %r5287, 6; | |
bfe.u32 %r5289, %r5286, 16, 6; | |
or.b32 %r30, %r5288, %r5289; | |
st.local.u32 [%rd2+16], %r30; | |
bfe.u32 %r5290, %r5283, 22, 6; | |
mul.wide.u32 %rd509, %r5290, 28; | |
add.s64 %rd510, %rd506, %rd509; | |
ld.global.u32 %r5291, [%rd510]; | |
and.b32 %r5292, %r5291, 65535; | |
shl.b32 %r5293, %r5292, 6; | |
bfe.u32 %r5294, %r5291, 16, 6; | |
or.b32 %r13322, %r5293, %r5294; | |
st.local.u32 [%rd2+20], %r13322; | |
setp.le.u32 %p10, %r30, %r13322; | |
mov.u32 %r13321, %r30; | |
@%p10 bra BB12_16; | |
st.local.v2.u32 [%rd2+16], {%r13322, %r30}; | |
mov.u32 %r11417, %r13322; | |
mov.u32 %r13322, %r30; | |
mov.u32 %r13321, %r11417; | |
BB12_16: | |
mov.u32 %r13317, %r13321; | |
mov.u32 %r13318, %r13322; | |
bfe.u32 %r5295, %r29, 22, 6; | |
mul.lo.s64 %rd511, %rd22, 1792; | |
add.s64 %rd512, %rd415, %rd511; | |
mul.wide.u32 %rd513, %r5295, 28; | |
add.s64 %rd514, %rd512, %rd513; | |
ld.global.u32 %r5296, [%rd514]; | |
and.b32 %r5297, %r5296, 65535; | |
bfe.u32 %r5298, %r5296, 16, 6; | |
mul.wide.u32 %rd515, %r5297, 1792; | |
add.s64 %rd516, %rd414, %rd515; | |
mul.wide.u32 %rd517, %r5298, 28; | |
add.s64 %rd518, %rd516, %rd517; | |
ld.global.u32 %r5299, [%rd518]; | |
and.b32 %r5300, %r5299, 65535; | |
shl.b32 %r5301, %r5300, 6; | |
bfe.u32 %r5302, %r5299, 16, 6; | |
or.b32 %r34, %r5301, %r5302; | |
st.local.u32 [%rd2+24], %r34; | |
bfe.u32 %r5303, %r5296, 22, 6; | |
mul.wide.u32 %rd519, %r5303, 28; | |
add.s64 %rd520, %rd516, %rd519; | |
ld.global.u32 %r5304, [%rd520]; | |
and.b32 %r5305, %r5304, 65535; | |
shl.b32 %r5306, %r5305, 6; | |
bfe.u32 %r5307, %r5304, 16, 6; | |
or.b32 %r13324, %r5306, %r5307; | |
st.local.u32 [%rd2+28], %r13324; | |
setp.le.u32 %p11, %r34, %r13324; | |
mov.u32 %r13323, %r34; | |
@%p11 bra BB12_18; | |
st.local.v2.u32 [%rd2+24], {%r13324, %r34}; | |
mov.u32 %r11423, %r13324; | |
mov.u32 %r13324, %r34; | |
mov.u32 %r13323, %r11423; | |
BB12_18: | |
mov.u32 %r37, %r13323; | |
mov.u32 %r36, %r13324; | |
setp.le.u32 %p12, %r13317, %r37; | |
mov.u32 %r13319, %r37; | |
mov.u32 %r13320, %r36; | |
@%p12 bra BB12_20; | |
st.local.v4.u32 [%rd2+16], {%r37, %r36, %r13317, %r13318}; | |
mov.u32 %r11420, %r13318; | |
mov.u32 %r11422, %r13317; | |
mov.u32 %r13318, %r36; | |
mov.u32 %r13317, %r37; | |
mov.u32 %r13319, %r11422; | |
mov.u32 %r13320, %r11420; | |
BB12_20: | |
mov.u32 %r41, %r13317; | |
mov.u32 %r40, %r13318; | |
mov.u32 %r39, %r13319; | |
mov.u32 %r38, %r13320; | |
setp.le.u32 %p13, %r13301, %r41; | |
mov.u32 %r13305, %r41; | |
mov.u32 %r13306, %r40; | |
mov.u32 %r13307, %r39; | |
mov.u32 %r13308, %r38; | |
@%p13 bra BB12_22; | |
st.local.v4.u32 [%rd2], {%r41, %r40, %r39, %r38}; | |
st.local.v4.u32 [%rd2+16], {%r13301, %r13302, %r13303, %r13304}; | |
mov.u32 %r11410, %r13304; | |
mov.u32 %r11412, %r13303; | |
mov.u32 %r11414, %r13302; | |
mov.u32 %r11416, %r13301; | |
mov.u32 %r13304, %r38; | |
mov.u32 %r13303, %r39; | |
mov.u32 %r13302, %r40; | |
mov.u32 %r13301, %r41; | |
mov.u32 %r13305, %r11416; | |
mov.u32 %r13306, %r11414; | |
mov.u32 %r13307, %r11412; | |
mov.u32 %r13308, %r11410; | |
BB12_22: | |
mov.u32 %r13285, %r13301; | |
mov.u32 %r13286, %r13302; | |
mov.u32 %r13287, %r13303; | |
mov.u32 %r13288, %r13304; | |
mov.u32 %r13289, %r13305; | |
mov.u32 %r13290, %r13306; | |
mov.u32 %r13291, %r13307; | |
mov.u32 %r13292, %r13308; | |
mul.lo.s64 %rd521, %rd18, 1792; | |
add.s64 %rd522, %rd6, %rd521; | |
bfe.u32 %r5308, %r14, 22, 6; | |
mul.wide.u32 %rd523, %r5308, 28; | |
add.s64 %rd524, %rd522, %rd523; | |
ld.global.u32 %r50, [%rd524+-8]; | |
and.b32 %r5309, %r50, 65535; | |
mul.wide.u32 %rd525, %r5309, 1792; | |
add.s64 %rd526, %rd4, %rd525; | |
cvt.u64.u32 %rd23, %r5309; | |
bfe.u32 %r5310, %r50, 16, 6; | |
mul.wide.u32 %rd527, %r5310, 28; | |
add.s64 %rd528, %rd526, %rd527; | |
ld.global.u32 %r51, [%rd528+-12]; | |
and.b32 %r5311, %r51, 65535; | |
cvt.u64.u32 %rd24, %r5311; | |
bfe.u32 %r5312, %r51, 16, 6; | |
mul.wide.u32 %rd529, %r5311, 1792; | |
add.s64 %rd530, %rd415, %rd529; | |
mul.wide.u32 %rd531, %r5312, 28; | |
add.s64 %rd532, %rd530, %rd531; | |
ld.global.u32 %r5313, [%rd532]; | |
and.b32 %r5314, %r5313, 65535; | |
bfe.u32 %r5315, %r5313, 16, 6; | |
mul.wide.u32 %rd533, %r5314, 1792; | |
add.s64 %rd534, %rd414, %rd533; | |
mul.wide.u32 %rd535, %r5315, 28; | |
add.s64 %rd536, %rd534, %rd535; | |
ld.global.u32 %r5316, [%rd536]; | |
and.b32 %r5317, %r5316, 65535; | |
shl.b32 %r5318, %r5317, 6; | |
bfe.u32 %r5319, %r5316, 16, 6; | |
or.b32 %r52, %r5318, %r5319; | |
st.local.u32 [%rd2+32], %r52; | |
bfe.u32 %r5320, %r5313, 22, 6; | |
mul.wide.u32 %rd537, %r5320, 28; | |
add.s64 %rd538, %rd534, %rd537; | |
ld.global.u32 %r5321, [%rd538]; | |
and.b32 %r5322, %r5321, 65535; | |
shl.b32 %r5323, %r5322, 6; | |
bfe.u32 %r5324, %r5321, 16, 6; | |
or.b32 %r13338, %r5323, %r5324; | |
st.local.u32 [%rd2+36], %r13338; | |
setp.le.u32 %p14, %r52, %r13338; | |
mov.u32 %r13337, %r52; | |
@%p14 bra BB12_24; | |
st.local.v2.u32 [%rd2+32], {%r13338, %r52}; | |
mov.u32 %r11453, %r13338; | |
mov.u32 %r13338, %r52; | |
mov.u32 %r13337, %r11453; | |
BB12_24: | |
mov.u32 %r13333, %r13337; | |
mov.u32 %r13334, %r13338; | |
bfe.u32 %r5325, %r51, 22, 6; | |
mul.lo.s64 %rd539, %rd24, 1792; | |
add.s64 %rd540, %rd415, %rd539; | |
mul.wide.u32 %rd541, %r5325, 28; | |
add.s64 %rd542, %rd540, %rd541; | |
ld.global.u32 %r5326, [%rd542]; | |
and.b32 %r5327, %r5326, 65535; | |
bfe.u32 %r5328, %r5326, 16, 6; | |
mul.wide.u32 %rd543, %r5327, 1792; | |
add.s64 %rd544, %rd414, %rd543; | |
mul.wide.u32 %rd545, %r5328, 28; | |
add.s64 %rd546, %rd544, %rd545; | |
ld.global.u32 %r5329, [%rd546]; | |
and.b32 %r5330, %r5329, 65535; | |
shl.b32 %r5331, %r5330, 6; | |
bfe.u32 %r5332, %r5329, 16, 6; | |
or.b32 %r56, %r5331, %r5332; | |
st.local.u32 [%rd2+40], %r56; | |
bfe.u32 %r5333, %r5326, 22, 6; | |
mul.wide.u32 %rd547, %r5333, 28; | |
add.s64 %rd548, %rd544, %rd547; | |
ld.global.u32 %r5334, [%rd548]; | |
and.b32 %r5335, %r5334, 65535; | |
shl.b32 %r5336, %r5335, 6; | |
bfe.u32 %r5337, %r5334, 16, 6; | |
or.b32 %r13340, %r5336, %r5337; | |
st.local.u32 [%rd2+44], %r13340; | |
setp.le.u32 %p15, %r56, %r13340; | |
mov.u32 %r13339, %r56; | |
@%p15 bra BB12_26; | |
st.local.v2.u32 [%rd2+40], {%r13340, %r56}; | |
mov.u32 %r11459, %r13340; | |
mov.u32 %r13340, %r56; | |
mov.u32 %r13339, %r11459; | |
BB12_26: | |
mov.u32 %r59, %r13339; | |
mov.u32 %r58, %r13340; | |
setp.le.u32 %p16, %r13333, %r59; | |
mov.u32 %r13335, %r59; | |
mov.u32 %r13336, %r58; | |
@%p16 bra BB12_28; | |
st.local.v4.u32 [%rd2+32], {%r59, %r58, %r13333, %r13334}; | |
mov.u32 %r11456, %r13334; | |
mov.u32 %r11458, %r13333; | |
mov.u32 %r13334, %r58; | |
mov.u32 %r13333, %r59; | |
mov.u32 %r13335, %r11458; | |
mov.u32 %r13336, %r11456; | |
BB12_28: | |
mov.u32 %r13325, %r13333; | |
mov.u32 %r13326, %r13334; | |
mov.u32 %r13327, %r13335; | |
mov.u32 %r13328, %r13336; | |
mul.lo.s64 %rd549, %rd23, 1792; | |
add.s64 %rd550, %rd4, %rd549; | |
bfe.u32 %r5338, %r50, 22, 6; | |
mul.wide.u32 %rd551, %r5338, 28; | |
add.s64 %rd552, %rd550, %rd551; | |
ld.global.u32 %r64, [%rd552+-12]; | |
and.b32 %r5339, %r64, 65535; | |
cvt.u64.u32 %rd25, %r5339; | |
bfe.u32 %r5340, %r64, 16, 6; | |
mul.wide.u32 %rd553, %r5339, 1792; | |
add.s64 %rd554, %rd415, %rd553; | |
mul.wide.u32 %rd555, %r5340, 28; | |
add.s64 %rd556, %rd554, %rd555; | |
ld.global.u32 %r5341, [%rd556]; | |
and.b32 %r5342, %r5341, 65535; | |
bfe.u32 %r5343, %r5341, 16, 6; | |
mul.wide.u32 %rd557, %r5342, 1792; | |
add.s64 %rd558, %rd414, %rd557; | |
mul.wide.u32 %rd559, %r5343, 28; | |
add.s64 %rd560, %rd558, %rd559; | |
ld.global.u32 %r5344, [%rd560]; | |
and.b32 %r5345, %r5344, 65535; | |
shl.b32 %r5346, %r5345, 6; | |
bfe.u32 %r5347, %r5344, 16, 6; | |
or.b32 %r65, %r5346, %r5347; | |
st.local.u32 [%rd2+48], %r65; | |
bfe.u32 %r5348, %r5341, 22, 6; | |
mul.wide.u32 %rd561, %r5348, 28; | |
add.s64 %rd562, %rd558, %rd561; | |
ld.global.u32 %r5349, [%rd562]; | |
and.b32 %r5350, %r5349, 65535; | |
shl.b32 %r5351, %r5350, 6; | |
bfe.u32 %r5352, %r5349, 16, 6; | |
or.b32 %r13346, %r5351, %r5352; | |
st.local.u32 [%rd2+52], %r13346; | |
setp.le.u32 %p17, %r65, %r13346; | |
mov.u32 %r13345, %r65; | |
@%p17 bra BB12_30; | |
st.local.v2.u32 [%rd2+48], {%r13346, %r65}; | |
mov.u32 %r11473, %r13346; | |
mov.u32 %r13346, %r65; | |
mov.u32 %r13345, %r11473; | |
BB12_30: | |
mov.u32 %r13341, %r13345; | |
mov.u32 %r13342, %r13346; | |
bfe.u32 %r5353, %r64, 22, 6; | |
mul.lo.s64 %rd563, %rd25, 1792; | |
add.s64 %rd564, %rd415, %rd563; | |
mul.wide.u32 %rd565, %r5353, 28; | |
add.s64 %rd566, %rd564, %rd565; | |
ld.global.u32 %r5354, [%rd566]; | |
and.b32 %r5355, %r5354, 65535; | |
bfe.u32 %r5356, %r5354, 16, 6; | |
mul.wide.u32 %rd567, %r5355, 1792; | |
add.s64 %rd568, %rd414, %rd567; | |
mul.wide.u32 %rd569, %r5356, 28; | |
add.s64 %rd570, %rd568, %rd569; | |
ld.global.u32 %r5357, [%rd570]; | |
and.b32 %r5358, %r5357, 65535; | |
shl.b32 %r5359, %r5358, 6; | |
bfe.u32 %r5360, %r5357, 16, 6; | |
or.b32 %r69, %r5359, %r5360; | |
st.local.u32 [%rd2+56], %r69; | |
bfe.u32 %r5361, %r5354, 22, 6; | |
mul.wide.u32 %rd571, %r5361, 28; | |
add.s64 %rd572, %rd568, %rd571; | |
ld.global.u32 %r5362, [%rd572]; | |
and.b32 %r5363, %r5362, 65535; | |
shl.b32 %r5364, %r5363, 6; | |
bfe.u32 %r5365, %r5362, 16, 6; | |
or.b32 %r13348, %r5364, %r5365; | |
st.local.u32 [%rd2+60], %r13348; | |
setp.le.u32 %p18, %r69, %r13348; | |
mov.u32 %r13347, %r69; | |
@%p18 bra BB12_32; | |
st.local.v2.u32 [%rd2+56], {%r13348, %r69}; | |
mov.u32 %r11479, %r13348; | |
mov.u32 %r13348, %r69; | |
mov.u32 %r13347, %r11479; | |
BB12_32: | |
mov.u32 %r72, %r13347; | |
mov.u32 %r71, %r13348; | |
setp.le.u32 %p19, %r13341, %r72; | |
mov.u32 %r13343, %r72; | |
mov.u32 %r13344, %r71; | |
@%p19 bra BB12_34; | |
st.local.v4.u32 [%rd2+48], {%r72, %r71, %r13341, %r13342}; | |
mov.u32 %r11476, %r13342; | |
mov.u32 %r11478, %r13341; | |
mov.u32 %r13342, %r71; | |
mov.u32 %r13341, %r72; | |
mov.u32 %r13343, %r11478; | |
mov.u32 %r13344, %r11476; | |
BB12_34: | |
mov.u32 %r76, %r13341; | |
mov.u32 %r75, %r13342; | |
mov.u32 %r74, %r13343; | |
mov.u32 %r73, %r13344; | |
setp.le.u32 %p20, %r13325, %r76; | |
mov.u32 %r13329, %r76; | |
mov.u32 %r13330, %r75; | |
mov.u32 %r13331, %r74; | |
mov.u32 %r13332, %r73; | |
@%p20 bra BB12_36; | |
st.local.v4.u32 [%rd2+32], {%r76, %r75, %r74, %r73}; | |
st.local.v4.u32 [%rd2+48], {%r13325, %r13326, %r13327, %r13328}; | |
mov.u32 %r11466, %r13328; | |
mov.u32 %r11468, %r13327; | |
mov.u32 %r11470, %r13326; | |
mov.u32 %r11472, %r13325; | |
mov.u32 %r13328, %r73; | |
mov.u32 %r13327, %r74; | |
mov.u32 %r13326, %r75; | |
mov.u32 %r13325, %r76; | |
mov.u32 %r13329, %r11472; | |
mov.u32 %r13330, %r11470; | |
mov.u32 %r13331, %r11468; | |
mov.u32 %r13332, %r11466; | |
BB12_36: | |
mov.u32 %r84, %r13325; | |
mov.u32 %r83, %r13326; | |
mov.u32 %r82, %r13327; | |
mov.u32 %r81, %r13328; | |
mov.u32 %r80, %r13329; | |
mov.u32 %r79, %r13330; | |
mov.u32 %r78, %r13331; | |
mov.u32 %r77, %r13332; | |
setp.le.u32 %p21, %r13285, %r84; | |
mov.u32 %r13293, %r84; | |
mov.u32 %r13294, %r83; | |
mov.u32 %r13295, %r82; | |
mov.u32 %r13296, %r81; | |
mov.u32 %r13297, %r80; | |
mov.u32 %r13298, %r79; | |
mov.u32 %r13299, %r78; | |
mov.u32 %r13300, %r77; | |
@%p21 bra BB12_38; | |
st.local.v4.u32 [%rd2], {%r84, %r83, %r82, %r81}; | |
st.local.v4.u32 [%rd2+32], {%r13285, %r13286, %r13287, %r13288}; | |
st.local.v4.u32 [%rd2+16], {%r80, %r79, %r78, %r77}; | |
st.local.v4.u32 [%rd2+48], {%r13289, %r13290, %r13291, %r13292}; | |
mov.u32 %r11438, %r13292; | |
mov.u32 %r11440, %r13291; | |
mov.u32 %r11442, %r13290; | |
mov.u32 %r11444, %r13289; | |
mov.u32 %r11446, %r13288; | |
mov.u32 %r11448, %r13287; | |
mov.u32 %r11450, %r13286; | |
mov.u32 %r11452, %r13285; | |
mov.u32 %r13292, %r77; | |
mov.u32 %r13291, %r78; | |
mov.u32 %r13290, %r79; | |
mov.u32 %r13289, %r80; | |
mov.u32 %r13288, %r81; | |
mov.u32 %r13287, %r82; | |
mov.u32 %r13286, %r83; | |
mov.u32 %r13285, %r84; | |
mov.u32 %r13293, %r11452; | |
mov.u32 %r13294, %r11450; | |
mov.u32 %r13295, %r11448; | |
mov.u32 %r13296, %r11446; | |
mov.u32 %r13297, %r11444; | |
mov.u32 %r13298, %r11442; | |
mov.u32 %r13299, %r11440; | |
mov.u32 %r13300, %r11438; | |
BB12_38: | |
mov.u32 %r13253, %r13285; | |
mov.u32 %r13254, %r13286; | |
mov.u32 %r13255, %r13287; | |
mov.u32 %r13256, %r13288; | |
mov.u32 %r13257, %r13289; | |
mov.u32 %r13258, %r13290; | |
mov.u32 %r13259, %r13291; | |
mov.u32 %r13260, %r13292; | |
mov.u32 %r13261, %r13293; | |
mov.u32 %r13262, %r13294; | |
mov.u32 %r13263, %r13295; | |
mov.u32 %r13264, %r13296; | |
mov.u32 %r13265, %r13297; | |
mov.u32 %r13266, %r13298; | |
mov.u32 %r13267, %r13299; | |
mov.u32 %r13268, %r13300; | |
mul.lo.s64 %rd573, %rd17, 1792; | |
add.s64 %rd574, %rd4, %rd573; | |
bfe.u32 %r5366, %r13, 22, 6; | |
mul.wide.u32 %rd575, %r5366, 28; | |
add.s64 %rd576, %rd574, %rd575; | |
ld.global.u32 %r101, [%rd576+-8]; | |
and.b32 %r5367, %r101, 65535; | |
mul.wide.u32 %rd577, %r5367, 1792; | |
add.s64 %rd578, %rd6, %rd577; | |
bfe.u32 %r5368, %r101, 16, 6; | |
mul.wide.u32 %rd579, %r5368, 28; | |
add.s64 %rd580, %rd578, %rd579; | |
ld.global.u32 %r102, [%rd580+-8]; | |
and.b32 %r5369, %r102, 65535; | |
mul.wide.u32 %rd581, %r5369, 1792; | |
add.s64 %rd582, %rd4, %rd581; | |
cvt.u64.u32 %rd26, %r5367; | |
cvt.u64.u32 %rd27, %r5369; | |
bfe.u32 %r5370, %r102, 16, 6; | |
mul.wide.u32 %rd583, %r5370, 28; | |
add.s64 %rd584, %rd582, %rd583; | |
ld.global.u32 %r103, [%rd584+-12]; | |
and.b32 %r5371, %r103, 65535; | |
cvt.u64.u32 %rd28, %r5371; | |
bfe.u32 %r5372, %r103, 16, 6; | |
mul.wide.u32 %rd585, %r5371, 1792; | |
add.s64 %rd586, %rd415, %rd585; | |
mul.wide.u32 %rd587, %r5372, 28; | |
add.s64 %rd588, %rd586, %rd587; | |
ld.global.u32 %r5373, [%rd588]; | |
and.b32 %r5374, %r5373, 65535; | |
bfe.u32 %r5375, %r5373, 16, 6; | |
mul.wide.u32 %rd589, %r5374, 1792; | |
add.s64 %rd590, %rd414, %rd589; | |
mul.wide.u32 %rd591, %r5375, 28; | |
add.s64 %rd592, %rd590, %rd591; | |
ld.global.u32 %r5376, [%rd592]; | |
and.b32 %r5377, %r5376, 65535; | |
shl.b32 %r5378, %r5377, 6; | |
bfe.u32 %r5379, %r5376, 16, 6; | |
or.b32 %r104, %r5378, %r5379; | |
st.local.u32 [%rd2+64], %r104; | |
bfe.u32 %r5380, %r5373, 22, 6; | |
mul.wide.u32 %rd593, %r5380, 28; | |
add.s64 %rd594, %rd590, %rd593; | |
ld.global.u32 %r5381, [%rd594]; | |
and.b32 %r5382, %r5381, 65535; | |
shl.b32 %r5383, %r5382, 6; | |
bfe.u32 %r5384, %r5381, 16, 6; | |
or.b32 %r13378, %r5383, %r5384; | |
st.local.u32 [%rd2+68], %r13378; | |
setp.le.u32 %p22, %r104, %r13378; | |
mov.u32 %r13377, %r104; | |
@%p22 bra BB12_40; | |
st.local.v2.u32 [%rd2+64], {%r13378, %r104}; | |
mov.u32 %r11541, %r13378; | |
mov.u32 %r13378, %r104; | |
mov.u32 %r13377, %r11541; | |
BB12_40: | |
mov.u32 %r13373, %r13377; | |
mov.u32 %r13374, %r13378; | |
bfe.u32 %r5385, %r103, 22, 6; | |
mul.lo.s64 %rd595, %rd28, 1792; | |
add.s64 %rd596, %rd415, %rd595; | |
mul.wide.u32 %rd597, %r5385, 28; | |
add.s64 %rd598, %rd596, %rd597; | |
ld.global.u32 %r5386, [%rd598]; | |
and.b32 %r5387, %r5386, 65535; | |
bfe.u32 %r5388, %r5386, 16, 6; | |
mul.wide.u32 %rd599, %r5387, 1792; | |
add.s64 %rd600, %rd414, %rd599; | |
mul.wide.u32 %rd601, %r5388, 28; | |
add.s64 %rd602, %rd600, %rd601; | |
ld.global.u32 %r5389, [%rd602]; | |
and.b32 %r5390, %r5389, 65535; | |
shl.b32 %r5391, %r5390, 6; | |
bfe.u32 %r5392, %r5389, 16, 6; | |
or.b32 %r108, %r5391, %r5392; | |
st.local.u32 [%rd2+72], %r108; | |
bfe.u32 %r5393, %r5386, 22, 6; | |
mul.wide.u32 %rd603, %r5393, 28; | |
add.s64 %rd604, %rd600, %rd603; | |
ld.global.u32 %r5394, [%rd604]; | |
and.b32 %r5395, %r5394, 65535; | |
shl.b32 %r5396, %r5395, 6; | |
bfe.u32 %r5397, %r5394, 16, 6; | |
or.b32 %r13380, %r5396, %r5397; | |
st.local.u32 [%rd2+76], %r13380; | |
setp.le.u32 %p23, %r108, %r13380; | |
mov.u32 %r13379, %r108; | |
@%p23 bra BB12_42; | |
st.local.v2.u32 [%rd2+72], {%r13380, %r108}; | |
mov.u32 %r11547, %r13380; | |
mov.u32 %r13380, %r108; | |
mov.u32 %r13379, %r11547; | |
BB12_42: | |
mov.u32 %r111, %r13379; | |
mov.u32 %r110, %r13380; | |
setp.le.u32 %p24, %r13373, %r111; | |
mov.u32 %r13375, %r111; | |
mov.u32 %r13376, %r110; | |
@%p24 bra BB12_44; | |
st.local.v4.u32 [%rd2+64], {%r111, %r110, %r13373, %r13374}; | |
mov.u32 %r11544, %r13374; | |
mov.u32 %r11546, %r13373; | |
mov.u32 %r13374, %r110; | |
mov.u32 %r13373, %r111; | |
mov.u32 %r13375, %r11546; | |
mov.u32 %r13376, %r11544; | |
BB12_44: | |
mov.u32 %r13365, %r13373; | |
mov.u32 %r13366, %r13374; | |
mov.u32 %r13367, %r13375; | |
mov.u32 %r13368, %r13376; | |
mul.lo.s64 %rd605, %rd27, 1792; | |
add.s64 %rd606, %rd4, %rd605; | |
bfe.u32 %r5398, %r102, 22, 6; | |
mul.wide.u32 %rd607, %r5398, 28; | |
add.s64 %rd608, %rd606, %rd607; | |
ld.global.u32 %r116, [%rd608+-12]; | |
and.b32 %r5399, %r116, 65535; | |
cvt.u64.u32 %rd29, %r5399; | |
bfe.u32 %r5400, %r116, 16, 6; | |
mul.wide.u32 %rd609, %r5399, 1792; | |
add.s64 %rd610, %rd415, %rd609; | |
mul.wide.u32 %rd611, %r5400, 28; | |
add.s64 %rd612, %rd610, %rd611; | |
ld.global.u32 %r5401, [%rd612]; | |
and.b32 %r5402, %r5401, 65535; | |
bfe.u32 %r5403, %r5401, 16, 6; | |
mul.wide.u32 %rd613, %r5402, 1792; | |
add.s64 %rd614, %rd414, %rd613; | |
mul.wide.u32 %rd615, %r5403, 28; | |
add.s64 %rd616, %rd614, %rd615; | |
ld.global.u32 %r5404, [%rd616]; | |
and.b32 %r5405, %r5404, 65535; | |
shl.b32 %r5406, %r5405, 6; | |
bfe.u32 %r5407, %r5404, 16, 6; | |
or.b32 %r117, %r5406, %r5407; | |
st.local.u32 [%rd2+80], %r117; | |
bfe.u32 %r5408, %r5401, 22, 6; | |
mul.wide.u32 %rd617, %r5408, 28; | |
add.s64 %rd618, %rd614, %rd617; | |
ld.global.u32 %r5409, [%rd618]; | |
and.b32 %r5410, %r5409, 65535; | |
shl.b32 %r5411, %r5410, 6; | |
bfe.u32 %r5412, %r5409, 16, 6; | |
or.b32 %r13386, %r5411, %r5412; | |
st.local.u32 [%rd2+84], %r13386; | |
setp.le.u32 %p25, %r117, %r13386; | |
mov.u32 %r13385, %r117; | |
@%p25 bra BB12_46; | |
st.local.v2.u32 [%rd2+80], {%r13386, %r117}; | |
mov.u32 %r11561, %r13386; | |
mov.u32 %r13386, %r117; | |
mov.u32 %r13385, %r11561; | |
BB12_46: | |
mov.u32 %r13381, %r13385; | |
mov.u32 %r13382, %r13386; | |
bfe.u32 %r5413, %r116, 22, 6; | |
mul.lo.s64 %rd619, %rd29, 1792; | |
add.s64 %rd620, %rd415, %rd619; | |
mul.wide.u32 %rd621, %r5413, 28; | |
add.s64 %rd622, %rd620, %rd621; | |
ld.global.u32 %r5414, [%rd622]; | |
and.b32 %r5415, %r5414, 65535; | |
bfe.u32 %r5416, %r5414, 16, 6; | |
mul.wide.u32 %rd623, %r5415, 1792; | |
add.s64 %rd624, %rd414, %rd623; | |
mul.wide.u32 %rd625, %r5416, 28; | |
add.s64 %rd626, %rd624, %rd625; | |
ld.global.u32 %r5417, [%rd626]; | |
and.b32 %r5418, %r5417, 65535; | |
shl.b32 %r5419, %r5418, 6; | |
bfe.u32 %r5420, %r5417, 16, 6; | |
or.b32 %r121, %r5419, %r5420; | |
st.local.u32 [%rd2+88], %r121; | |
bfe.u32 %r5421, %r5414, 22, 6; | |
mul.wide.u32 %rd627, %r5421, 28; | |
add.s64 %rd628, %rd624, %rd627; | |
ld.global.u32 %r5422, [%rd628]; | |
and.b32 %r5423, %r5422, 65535; | |
shl.b32 %r5424, %r5423, 6; | |
bfe.u32 %r5425, %r5422, 16, 6; | |
or.b32 %r13388, %r5424, %r5425; | |
st.local.u32 [%rd2+92], %r13388; | |
setp.le.u32 %p26, %r121, %r13388; | |
mov.u32 %r13387, %r121; | |
@%p26 bra BB12_48; | |
st.local.v2.u32 [%rd2+88], {%r13388, %r121}; | |
mov.u32 %r11567, %r13388; | |
mov.u32 %r13388, %r121; | |
mov.u32 %r13387, %r11567; | |
BB12_48: | |
mov.u32 %r124, %r13387; | |
mov.u32 %r123, %r13388; | |
setp.le.u32 %p27, %r13381, %r124; | |
mov.u32 %r13383, %r124; | |
mov.u32 %r13384, %r123; | |
@%p27 bra BB12_50; | |
st.local.v4.u32 [%rd2+80], {%r124, %r123, %r13381, %r13382}; | |
mov.u32 %r11564, %r13382; | |
mov.u32 %r11566, %r13381; | |
mov.u32 %r13382, %r123; | |
mov.u32 %r13381, %r124; | |
mov.u32 %r13383, %r11566; | |
mov.u32 %r13384, %r11564; | |
BB12_50: | |
mov.u32 %r128, %r13381; | |
mov.u32 %r127, %r13382; | |
mov.u32 %r126, %r13383; | |
mov.u32 %r125, %r13384; | |
setp.le.u32 %p28, %r13365, %r128; | |
mov.u32 %r13369, %r128; | |
mov.u32 %r13370, %r127; | |
mov.u32 %r13371, %r126; | |
mov.u32 %r13372, %r125; | |
@%p28 bra BB12_52; | |
st.local.v4.u32 [%rd2+64], {%r128, %r127, %r126, %r125}; | |
st.local.v4.u32 [%rd2+80], {%r13365, %r13366, %r13367, %r13368}; | |
mov.u32 %r11554, %r13368; | |
mov.u32 %r11556, %r13367; | |
mov.u32 %r11558, %r13366; | |
mov.u32 %r11560, %r13365; | |
mov.u32 %r13368, %r125; | |
mov.u32 %r13367, %r126; | |
mov.u32 %r13366, %r127; | |
mov.u32 %r13365, %r128; | |
mov.u32 %r13369, %r11560; | |
mov.u32 %r13370, %r11558; | |
mov.u32 %r13371, %r11556; | |
mov.u32 %r13372, %r11554; | |
BB12_52: | |
mov.u32 %r13349, %r13365; | |
mov.u32 %r13350, %r13366; | |
mov.u32 %r13351, %r13367; | |
mov.u32 %r13352, %r13368; | |
mov.u32 %r13353, %r13369; | |
mov.u32 %r13354, %r13370; | |
mov.u32 %r13355, %r13371; | |
mov.u32 %r13356, %r13372; | |
mul.lo.s64 %rd629, %rd26, 1792; | |
add.s64 %rd630, %rd6, %rd629; | |
bfe.u32 %r5426, %r101, 22, 6; | |
mul.wide.u32 %rd631, %r5426, 28; | |
add.s64 %rd632, %rd630, %rd631; | |
ld.global.u32 %r137, [%rd632+-8]; | |
and.b32 %r5427, %r137, 65535; | |
mul.wide.u32 %rd633, %r5427, 1792; | |
add.s64 %rd634, %rd4, %rd633; | |
cvt.u64.u32 %rd30, %r5427; | |
bfe.u32 %r5428, %r137, 16, 6; | |
mul.wide.u32 %rd635, %r5428, 28; | |
add.s64 %rd636, %rd634, %rd635; | |
ld.global.u32 %r138, [%rd636+-12]; | |
and.b32 %r5429, %r138, 65535; | |
cvt.u64.u32 %rd31, %r5429; | |
bfe.u32 %r5430, %r138, 16, 6; | |
mul.wide.u32 %rd637, %r5429, 1792; | |
add.s64 %rd638, %rd415, %rd637; | |
mul.wide.u32 %rd639, %r5430, 28; | |
add.s64 %rd640, %rd638, %rd639; | |
ld.global.u32 %r5431, [%rd640]; | |
and.b32 %r5432, %r5431, 65535; | |
bfe.u32 %r5433, %r5431, 16, 6; | |
mul.wide.u32 %rd641, %r5432, 1792; | |
add.s64 %rd642, %rd414, %rd641; | |
mul.wide.u32 %rd643, %r5433, 28; | |
add.s64 %rd644, %rd642, %rd643; | |
ld.global.u32 %r5434, [%rd644]; | |
and.b32 %r5435, %r5434, 65535; | |
shl.b32 %r5436, %r5435, 6; | |
bfe.u32 %r5437, %r5434, 16, 6; | |
or.b32 %r139, %r5436, %r5437; | |
st.local.u32 [%rd2+96], %r139; | |
bfe.u32 %r5438, %r5431, 22, 6; | |
mul.wide.u32 %rd645, %r5438, 28; | |
add.s64 %rd646, %rd642, %rd645; | |
ld.global.u32 %r5439, [%rd646]; | |
and.b32 %r5440, %r5439, 65535; | |
shl.b32 %r5441, %r5440, 6; | |
bfe.u32 %r5442, %r5439, 16, 6; | |
or.b32 %r13402, %r5441, %r5442; | |
st.local.u32 [%rd2+100], %r13402; | |
setp.le.u32 %p29, %r139, %r13402; | |
mov.u32 %r13401, %r139; | |
@%p29 bra BB12_54; | |
st.local.v2.u32 [%rd2+96], {%r13402, %r139}; | |
mov.u32 %r11597, %r13402; | |
mov.u32 %r13402, %r139; | |
mov.u32 %r13401, %r11597; | |
BB12_54: | |
mov.u32 %r13397, %r13401; | |
mov.u32 %r13398, %r13402; | |
bfe.u32 %r5443, %r138, 22, 6; | |
mul.lo.s64 %rd647, %rd31, 1792; | |
add.s64 %rd648, %rd415, %rd647; | |
mul.wide.u32 %rd649, %r5443, 28; | |
add.s64 %rd650, %rd648, %rd649; | |
ld.global.u32 %r5444, [%rd650]; | |
and.b32 %r5445, %r5444, 65535; | |
bfe.u32 %r5446, %r5444, 16, 6; | |
mul.wide.u32 %rd651, %r5445, 1792; | |
add.s64 %rd652, %rd414, %rd651; | |
mul.wide.u32 %rd653, %r5446, 28; | |
add.s64 %rd654, %rd652, %rd653; | |
ld.global.u32 %r5447, [%rd654]; | |
and.b32 %r5448, %r5447, 65535; | |
shl.b32 %r5449, %r5448, 6; | |
bfe.u32 %r5450, %r5447, 16, 6; | |
or.b32 %r143, %r5449, %r5450; | |
st.local.u32 [%rd2+104], %r143; | |
bfe.u32 %r5451, %r5444, 22, 6; | |
mul.wide.u32 %rd655, %r5451, 28; | |
add.s64 %rd656, %rd652, %rd655; | |
ld.global.u32 %r5452, [%rd656]; | |
and.b32 %r5453, %r5452, 65535; | |
shl.b32 %r5454, %r5453, 6; | |
bfe.u32 %r5455, %r5452, 16, 6; | |
or.b32 %r13404, %r5454, %r5455; | |
st.local.u32 [%rd2+108], %r13404; | |
setp.le.u32 %p30, %r143, %r13404; | |
mov.u32 %r13403, %r143; | |
@%p30 bra BB12_56; | |
st.local.v2.u32 [%rd2+104], {%r13404, %r143}; | |
mov.u32 %r11603, %r13404; | |
mov.u32 %r13404, %r143; | |
mov.u32 %r13403, %r11603; | |
BB12_56: | |
mov.u32 %r146, %r13403; | |
mov.u32 %r145, %r13404; | |
setp.le.u32 %p31, %r13397, %r146; | |
mov.u32 %r13399, %r146; | |
mov.u32 %r13400, %r145; | |
@%p31 bra BB12_58; | |
st.local.v4.u32 [%rd2+96], {%r146, %r145, %r13397, %r13398}; | |
mov.u32 %r11600, %r13398; | |
mov.u32 %r11602, %r13397; | |
mov.u32 %r13398, %r145; | |
mov.u32 %r13397, %r146; | |
mov.u32 %r13399, %r11602; | |
mov.u32 %r13400, %r11600; | |
BB12_58: | |
mov.u32 %r13389, %r13397; | |
mov.u32 %r13390, %r13398; | |
mov.u32 %r13391, %r13399; | |
mov.u32 %r13392, %r13400; | |
mul.lo.s64 %rd657, %rd30, 1792; | |
add.s64 %rd658, %rd4, %rd657; | |
bfe.u32 %r5456, %r137, 22, 6; | |
mul.wide.u32 %rd659, %r5456, 28; | |
add.s64 %rd660, %rd658, %rd659; | |
ld.global.u32 %r151, [%rd660+-12]; | |
and.b32 %r5457, %r151, 65535; | |
cvt.u64.u32 %rd32, %r5457; | |
bfe.u32 %r5458, %r151, 16, 6; | |
mul.wide.u32 %rd661, %r5457, 1792; | |
add.s64 %rd662, %rd415, %rd661; | |
mul.wide.u32 %rd663, %r5458, 28; | |
add.s64 %rd664, %rd662, %rd663; | |
ld.global.u32 %r5459, [%rd664]; | |
and.b32 %r5460, %r5459, 65535; | |
bfe.u32 %r5461, %r5459, 16, 6; | |
mul.wide.u32 %rd665, %r5460, 1792; | |
add.s64 %rd666, %rd414, %rd665; | |
mul.wide.u32 %rd667, %r5461, 28; | |
add.s64 %rd668, %rd666, %rd667; | |
ld.global.u32 %r5462, [%rd668]; | |
and.b32 %r5463, %r5462, 65535; | |
shl.b32 %r5464, %r5463, 6; | |
bfe.u32 %r5465, %r5462, 16, 6; | |
or.b32 %r152, %r5464, %r5465; | |
st.local.u32 [%rd2+112], %r152; | |
bfe.u32 %r5466, %r5459, 22, 6; | |
mul.wide.u32 %rd669, %r5466, 28; | |
add.s64 %rd670, %rd666, %rd669; | |
ld.global.u32 %r5467, [%rd670]; | |
and.b32 %r5468, %r5467, 65535; | |
shl.b32 %r5469, %r5468, 6; | |
bfe.u32 %r5470, %r5467, 16, 6; | |
or.b32 %r13410, %r5469, %r5470; | |
st.local.u32 [%rd2+116], %r13410; | |
setp.le.u32 %p32, %r152, %r13410; | |
mov.u32 %r13409, %r152; | |
@%p32 bra BB12_60; | |
st.local.v2.u32 [%rd2+112], {%r13410, %r152}; | |
mov.u32 %r11617, %r13410; | |
mov.u32 %r13410, %r152; | |
mov.u32 %r13409, %r11617; | |
BB12_60: | |
mov.u32 %r13405, %r13409; | |
mov.u32 %r13406, %r13410; | |
bfe.u32 %r5471, %r151, 22, 6; | |
mul.lo.s64 %rd671, %rd32, 1792; | |
add.s64 %rd672, %rd415, %rd671; | |
mul.wide.u32 %rd673, %r5471, 28; | |
add.s64 %rd674, %rd672, %rd673; | |
ld.global.u32 %r5472, [%rd674]; | |
and.b32 %r5473, %r5472, 65535; | |
bfe.u32 %r5474, %r5472, 16, 6; | |
mul.wide.u32 %rd675, %r5473, 1792; | |
add.s64 %rd676, %rd414, %rd675; | |
mul.wide.u32 %rd677, %r5474, 28; | |
add.s64 %rd678, %rd676, %rd677; | |
ld.global.u32 %r5475, [%rd678]; | |
and.b32 %r5476, %r5475, 65535; | |
shl.b32 %r5477, %r5476, 6; | |
bfe.u32 %r5478, %r5475, 16, 6; | |
or.b32 %r156, %r5477, %r5478; | |
st.local.u32 [%rd2+120], %r156; | |
bfe.u32 %r5479, %r5472, 22, 6; | |
mul.wide.u32 %rd679, %r5479, 28; | |
add.s64 %rd680, %rd676, %rd679; | |
ld.global.u32 %r5480, [%rd680]; | |
and.b32 %r5481, %r5480, 65535; | |
shl.b32 %r5482, %r5481, 6; | |
bfe.u32 %r5483, %r5480, 16, 6; | |
or.b32 %r13412, %r5482, %r5483; | |
st.local.u32 [%rd2+124], %r13412; | |
setp.le.u32 %p33, %r156, %r13412; | |
mov.u32 %r13411, %r156; | |
@%p33 bra BB12_62; | |
st.local.v2.u32 [%rd2+120], {%r13412, %r156}; | |
mov.u32 %r11623, %r13412; | |
mov.u32 %r13412, %r156; | |
mov.u32 %r13411, %r11623; | |
BB12_62: | |
mov.u32 %r159, %r13411; | |
mov.u32 %r158, %r13412; | |
setp.le.u32 %p34, %r13405, %r159; | |
mov.u32 %r13407, %r159; | |
mov.u32 %r13408, %r158; | |
@%p34 bra BB12_64; | |
st.local.v4.u32 [%rd2+112], {%r159, %r158, %r13405, %r13406}; | |
mov.u32 %r11620, %r13406; | |
mov.u32 %r11622, %r13405; | |
mov.u32 %r13406, %r158; | |
mov.u32 %r13405, %r159; | |
mov.u32 %r13407, %r11622; | |
mov.u32 %r13408, %r11620; | |
BB12_64: | |
mov.u32 %r163, %r13405; | |
mov.u32 %r162, %r13406; | |
mov.u32 %r161, %r13407; | |
mov.u32 %r160, %r13408; | |
setp.le.u32 %p35, %r13389, %r163; | |
mov.u32 %r13393, %r163; | |
mov.u32 %r13394, %r162; | |
mov.u32 %r13395, %r161; | |
mov.u32 %r13396, %r160; | |
@%p35 bra BB12_66; | |
st.local.v4.u32 [%rd2+96], {%r163, %r162, %r161, %r160}; | |
st.local.v4.u32 [%rd2+112], {%r13389, %r13390, %r13391, %r13392}; | |
mov.u32 %r11610, %r13392; | |
mov.u32 %r11612, %r13391; | |
mov.u32 %r11614, %r13390; | |
mov.u32 %r11616, %r13389; | |
mov.u32 %r13392, %r160; | |
mov.u32 %r13391, %r161; | |
mov.u32 %r13390, %r162; | |
mov.u32 %r13389, %r163; | |
mov.u32 %r13393, %r11616; | |
mov.u32 %r13394, %r11614; | |
mov.u32 %r13395, %r11612; | |
mov.u32 %r13396, %r11610; | |
BB12_66: | |
mov.u32 %r171, %r13389; | |
mov.u32 %r170, %r13390; | |
mov.u32 %r169, %r13391; | |
mov.u32 %r168, %r13392; | |
mov.u32 %r167, %r13393; | |
mov.u32 %r166, %r13394; | |
mov.u32 %r165, %r13395; | |
mov.u32 %r164, %r13396; | |
setp.le.u32 %p36, %r13349, %r171; | |
mov.u32 %r13357, %r171; | |
mov.u32 %r13358, %r170; | |
mov.u32 %r13359, %r169; | |
mov.u32 %r13360, %r168; | |
mov.u32 %r13361, %r167; | |
mov.u32 %r13362, %r166; | |
mov.u32 %r13363, %r165; | |
mov.u32 %r13364, %r164; | |
@%p36 bra BB12_68; | |
st.local.v4.u32 [%rd2+64], {%r171, %r170, %r169, %r168}; | |
st.local.v4.u32 [%rd2+96], {%r13349, %r13350, %r13351, %r13352}; | |
st.local.v4.u32 [%rd2+80], {%r167, %r166, %r165, %r164}; | |
st.local.v4.u32 [%rd2+112], {%r13353, %r13354, %r13355, %r13356}; | |
mov.u32 %r11582, %r13356; | |
mov.u32 %r11584, %r13355; | |
mov.u32 %r11586, %r13354; | |
mov.u32 %r11588, %r13353; | |
mov.u32 %r11590, %r13352; | |
mov.u32 %r11592, %r13351; | |
mov.u32 %r11594, %r13350; | |
mov.u32 %r11596, %r13349; | |
mov.u32 %r13356, %r164; | |
mov.u32 %r13355, %r165; | |
mov.u32 %r13354, %r166; | |
mov.u32 %r13353, %r167; | |
mov.u32 %r13352, %r168; | |
mov.u32 %r13351, %r169; | |
mov.u32 %r13350, %r170; | |
mov.u32 %r13349, %r171; | |
mov.u32 %r13357, %r11596; | |
mov.u32 %r13358, %r11594; | |
mov.u32 %r13359, %r11592; | |
mov.u32 %r13360, %r11590; | |
mov.u32 %r13361, %r11588; | |
mov.u32 %r13362, %r11586; | |
mov.u32 %r13363, %r11584; | |
mov.u32 %r13364, %r11582; | |
BB12_68: | |
mov.u32 %r187, %r13349; | |
mov.u32 %r186, %r13350; | |
mov.u32 %r185, %r13351; | |
mov.u32 %r184, %r13352; | |
mov.u32 %r183, %r13353; | |
mov.u32 %r182, %r13354; | |
mov.u32 %r181, %r13355; | |
mov.u32 %r180, %r13356; | |
mov.u32 %r179, %r13357; | |
mov.u32 %r178, %r13358; | |
mov.u32 %r177, %r13359; | |
mov.u32 %r176, %r13360; | |
mov.u32 %r175, %r13361; | |
mov.u32 %r174, %r13362; | |
mov.u32 %r173, %r13363; | |
mov.u32 %r172, %r13364; | |
setp.le.u32 %p37, %r13253, %r187; | |
mov.u32 %r13269, %r187; | |
mov.u32 %r13270, %r186; | |
mov.u32 %r13271, %r185; | |
mov.u32 %r13272, %r184; | |
mov.u32 %r13273, %r183; | |
mov.u32 %r13274, %r182; | |
mov.u32 %r13275, %r181; | |
mov.u32 %r13276, %r180; | |
mov.u32 %r13277, %r179; | |
mov.u32 %r13278, %r178; | |
mov.u32 %r13279, %r177; | |
mov.u32 %r13280, %r176; | |
mov.u32 %r13281, %r175; | |
mov.u32 %r13282, %r174; | |
mov.u32 %r13283, %r173; | |
mov.u32 %r13284, %r172; | |
@%p37 bra BB12_70; | |
st.local.v4.u32 [%rd2], {%r187, %r186, %r185, %r184}; | |
st.local.v4.u32 [%rd2+64], {%r13253, %r13254, %r13255, %r13256}; | |
st.local.v4.u32 [%rd2+16], {%r183, %r182, %r181, %r180}; | |
st.local.v4.u32 [%rd2+80], {%r13257, %r13258, %r13259, %r13260}; | |
st.local.v4.u32 [%rd2+32], {%r179, %r178, %r177, %r176}; | |
st.local.v4.u32 [%rd2+96], {%r13261, %r13262, %r13263, %r13264}; | |
st.local.v4.u32 [%rd2+48], {%r175, %r174, %r173, %r172}; | |
st.local.v4.u32 [%rd2+112], {%r13265, %r13266, %r13267, %r13268}; | |
mov.u32 %r11510, %r13268; | |
mov.u32 %r11512, %r13267; | |
mov.u32 %r11514, %r13266; | |
mov.u32 %r11516, %r13265; | |
mov.u32 %r11518, %r13264; | |
mov.u32 %r11520, %r13263; | |
mov.u32 %r11522, %r13262; | |
mov.u32 %r11524, %r13261; | |
mov.u32 %r11526, %r13260; | |
mov.u32 %r11528, %r13259; | |
mov.u32 %r11530, %r13258; | |
mov.u32 %r11532, %r13257; | |
mov.u32 %r11534, %r13256; | |
mov.u32 %r11536, %r13255; | |
mov.u32 %r11538, %r13254; | |
mov.u32 %r11540, %r13253; | |
mov.u32 %r13268, %r172; | |
mov.u32 %r13267, %r173; | |
mov.u32 %r13266, %r174; | |
mov.u32 %r13265, %r175; | |
mov.u32 %r13264, %r176; | |
mov.u32 %r13263, %r177; | |
mov.u32 %r13262, %r178; | |
mov.u32 %r13261, %r179; | |
mov.u32 %r13260, %r180; | |
mov.u32 %r13259, %r181; | |
mov.u32 %r13258, %r182; | |
mov.u32 %r13257, %r183; | |
mov.u32 %r13256, %r184; | |
mov.u32 %r13255, %r185; | |
mov.u32 %r13254, %r186; | |
mov.u32 %r13253, %r187; | |
mov.u32 %r13269, %r11540; | |
mov.u32 %r13270, %r11538; | |
mov.u32 %r13271, %r11536; | |
mov.u32 %r13272, %r11534; | |
mov.u32 %r13273, %r11532; | |
mov.u32 %r13274, %r11530; | |
mov.u32 %r13275, %r11528; | |
mov.u32 %r13276, %r11526; | |
mov.u32 %r13277, %r11524; | |
mov.u32 %r13278, %r11522; | |
mov.u32 %r13279, %r11520; | |
mov.u32 %r13280, %r11518; | |
mov.u32 %r13281, %r11516; | |
mov.u32 %r13282, %r11514; | |
mov.u32 %r13283, %r11512; | |
mov.u32 %r13284, %r11510; | |
BB12_70: | |
mov.u32 %r13189, %r13253; | |
mov.u32 %r13190, %r13254; | |
mov.u32 %r13191, %r13255; | |
mov.u32 %r13192, %r13256; | |
mov.u32 %r13193, %r13257; | |
mov.u32 %r13194, %r13258; | |
mov.u32 %r13195, %r13259; | |
mov.u32 %r13196, %r13260; | |
mov.u32 %r13197, %r13261; | |
mov.u32 %r13198, %r13262; | |
mov.u32 %r13199, %r13263; | |
mov.u32 %r13200, %r13264; | |
mov.u32 %r13201, %r13265; | |
mov.u32 %r13202, %r13266; | |
mov.u32 %r13203, %r13267; | |
mov.u32 %r13204, %r13268; | |
mov.u32 %r13205, %r13269; | |
mov.u32 %r13206, %r13270; | |
mov.u32 %r13207, %r13271; | |
mov.u32 %r13208, %r13272; | |
mov.u32 %r13209, %r13273; | |
mov.u32 %r13210, %r13274; | |
mov.u32 %r13211, %r13275; | |
mov.u32 %r13212, %r13276; | |
mov.u32 %r13213, %r13277; | |
mov.u32 %r13214, %r13278; | |
mov.u32 %r13215, %r13279; | |
mov.u32 %r13216, %r13280; | |
mov.u32 %r13217, %r13281; | |
mov.u32 %r13218, %r13282; | |
mov.u32 %r13219, %r13283; | |
mov.u32 %r13220, %r13284; | |
mul.lo.s64 %rd681, %rd16, 1792; | |
add.s64 %rd682, %rd6, %rd681; | |
bfe.u32 %r5484, %r12, 22, 6; | |
mul.wide.u32 %rd683, %r5484, 28; | |
add.s64 %rd684, %rd682, %rd683; | |
ld.global.u32 %r220, [%rd684+-4]; | |
and.b32 %r5485, %r220, 65535; | |
mul.wide.u32 %rd685, %r5485, 1792; | |
add.s64 %rd686, %rd4, %rd685; | |
bfe.u32 %r5486, %r220, 16, 6; | |
mul.wide.u32 %rd687, %r5486, 28; | |
add.s64 %rd688, %rd686, %rd687; | |
ld.global.u32 %r221, [%rd688+-8]; | |
and.b32 %r5487, %r221, 65535; | |
mul.wide.u32 %rd689, %r5487, 1792; | |
add.s64 %rd690, %rd6, %rd689; | |
bfe.u32 %r5488, %r221, 16, 6; | |
mul.wide.u32 %rd691, %r5488, 28; | |
add.s64 %rd692, %rd690, %rd691; | |
ld.global.u32 %r222, [%rd692+-8]; | |
and.b32 %r5489, %r222, 65535; | |
mul.wide.u32 %rd693, %r5489, 1792; | |
add.s64 %rd694, %rd4, %rd693; | |
cvt.u64.u32 %rd33, %r5485; | |
cvt.u64.u32 %rd34, %r5487; | |
cvt.u64.u32 %rd35, %r5489; | |
bfe.u32 %r5490, %r222, 16, 6; | |
mul.wide.u32 %rd695, %r5490, 28; | |
add.s64 %rd696, %rd694, %rd695; | |
ld.global.u32 %r223, [%rd696+-12]; | |
and.b32 %r5491, %r223, 65535; | |
cvt.u64.u32 %rd36, %r5491; | |
bfe.u32 %r5492, %r223, 16, 6; | |
mul.wide.u32 %rd697, %r5491, 1792; | |
add.s64 %rd698, %rd415, %rd697; | |
mul.wide.u32 %rd699, %r5492, 28; | |
add.s64 %rd700, %rd698, %rd699; | |
ld.global.u32 %r5493, [%rd700]; | |
and.b32 %r5494, %r5493, 65535; | |
bfe.u32 %r5495, %r5493, 16, 6; | |
mul.wide.u32 %rd701, %r5494, 1792; | |
add.s64 %rd702, %rd414, %rd701; | |
mul.wide.u32 %rd703, %r5495, 28; | |
add.s64 %rd704, %rd702, %rd703; | |
ld.global.u32 %r5496, [%rd704]; | |
and.b32 %r5497, %r5496, 65535; | |
shl.b32 %r5498, %r5497, 6; | |
bfe.u32 %r5499, %r5496, 16, 6; | |
or.b32 %r224, %r5498, %r5499; | |
st.local.u32 [%rd2+128], %r224; | |
bfe.u32 %r5500, %r5493, 22, 6; | |
mul.wide.u32 %rd705, %r5500, 28; | |
add.s64 %rd706, %rd702, %rd705; | |
ld.global.u32 %r5501, [%rd706]; | |
and.b32 %r5502, %r5501, 65535; | |
shl.b32 %r5503, %r5502, 6; | |
bfe.u32 %r5504, %r5501, 16, 6; | |
or.b32 %r13474, %r5503, %r5504; | |
st.local.u32 [%rd2+132], %r13474; | |
setp.le.u32 %p38, %r224, %r13474; | |
mov.u32 %r13473, %r224; | |
@%p38 bra BB12_72; | |
st.local.v2.u32 [%rd2+128], {%r13474, %r224}; | |
mov.u32 %r11749, %r13474; | |
mov.u32 %r13474, %r224; | |
mov.u32 %r13473, %r11749; | |
BB12_72: | |
mov.u32 %r13469, %r13473; | |
mov.u32 %r13470, %r13474; | |
bfe.u32 %r5505, %r223, 22, 6; | |
mul.lo.s64 %rd707, %rd36, 1792; | |
add.s64 %rd708, %rd415, %rd707; | |
mul.wide.u32 %rd709, %r5505, 28; | |
add.s64 %rd710, %rd708, %rd709; | |
ld.global.u32 %r5506, [%rd710]; | |
and.b32 %r5507, %r5506, 65535; | |
bfe.u32 %r5508, %r5506, 16, 6; | |
mul.wide.u32 %rd711, %r5507, 1792; | |
add.s64 %rd712, %rd414, %rd711; | |
mul.wide.u32 %rd713, %r5508, 28; | |
add.s64 %rd714, %rd712, %rd713; | |
ld.global.u32 %r5509, [%rd714]; | |
and.b32 %r5510, %r5509, 65535; | |
shl.b32 %r5511, %r5510, 6; | |
bfe.u32 %r5512, %r5509, 16, 6; | |
or.b32 %r228, %r5511, %r5512; | |
st.local.u32 [%rd2+136], %r228; | |
bfe.u32 %r5513, %r5506, 22, 6; | |
mul.wide.u32 %rd715, %r5513, 28; | |
add.s64 %rd716, %rd712, %rd715; | |
ld.global.u32 %r5514, [%rd716]; | |
and.b32 %r5515, %r5514, 65535; | |
shl.b32 %r5516, %r5515, 6; | |
bfe.u32 %r5517, %r5514, 16, 6; | |
or.b32 %r13476, %r5516, %r5517; | |
st.local.u32 [%rd2+140], %r13476; | |
setp.le.u32 %p39, %r228, %r13476; | |
mov.u32 %r13475, %r228; | |
@%p39 bra BB12_74; | |
st.local.v2.u32 [%rd2+136], {%r13476, %r228}; | |
mov.u32 %r11755, %r13476; | |
mov.u32 %r13476, %r228; | |
mov.u32 %r13475, %r11755; | |
BB12_74: | |
mov.u32 %r231, %r13475; | |
mov.u32 %r230, %r13476; | |
setp.le.u32 %p40, %r13469, %r231; | |
mov.u32 %r13471, %r231; | |
mov.u32 %r13472, %r230; | |
@%p40 bra BB12_76; | |
st.local.v4.u32 [%rd2+128], {%r231, %r230, %r13469, %r13470}; | |
mov.u32 %r11752, %r13470; | |
mov.u32 %r11754, %r13469; | |
mov.u32 %r13470, %r230; | |
mov.u32 %r13469, %r231; | |
mov.u32 %r13471, %r11754; | |
mov.u32 %r13472, %r11752; | |
BB12_76: | |
mov.u32 %r13461, %r13469; | |
mov.u32 %r13462, %r13470; | |
mov.u32 %r13463, %r13471; | |
mov.u32 %r13464, %r13472; | |
mul.lo.s64 %rd717, %rd35, 1792; | |
add.s64 %rd718, %rd4, %rd717; | |
bfe.u32 %r5518, %r222, 22, 6; | |
mul.wide.u32 %rd719, %r5518, 28; | |
add.s64 %rd720, %rd718, %rd719; | |
ld.global.u32 %r236, [%rd720+-12]; | |
and.b32 %r5519, %r236, 65535; | |
cvt.u64.u32 %rd37, %r5519; | |
bfe.u32 %r5520, %r236, 16, 6; | |
mul.wide.u32 %rd721, %r5519, 1792; | |
add.s64 %rd722, %rd415, %rd721; | |
mul.wide.u32 %rd723, %r5520, 28; | |
add.s64 %rd724, %rd722, %rd723; | |
ld.global.u32 %r5521, [%rd724]; | |
and.b32 %r5522, %r5521, 65535; | |
bfe.u32 %r5523, %r5521, 16, 6; | |
mul.wide.u32 %rd725, %r5522, 1792; | |
add.s64 %rd726, %rd414, %rd725; | |
mul.wide.u32 %rd727, %r5523, 28; | |
add.s64 %rd728, %rd726, %rd727; | |
ld.global.u32 %r5524, [%rd728]; | |
and.b32 %r5525, %r5524, 65535; | |
shl.b32 %r5526, %r5525, 6; | |
bfe.u32 %r5527, %r5524, 16, 6; | |
or.b32 %r237, %r5526, %r5527; | |
st.local.u32 [%rd2+144], %r237; | |
bfe.u32 %r5528, %r5521, 22, 6; | |
mul.wide.u32 %rd729, %r5528, 28; | |
add.s64 %rd730, %rd726, %rd729; | |
ld.global.u32 %r5529, [%rd730]; | |
and.b32 %r5530, %r5529, 65535; | |
shl.b32 %r5531, %r5530, 6; | |
bfe.u32 %r5532, %r5529, 16, 6; | |
or.b32 %r13482, %r5531, %r5532; | |
st.local.u32 [%rd2+148], %r13482; | |
setp.le.u32 %p41, %r237, %r13482; | |
mov.u32 %r13481, %r237; | |
@%p41 bra BB12_78; | |
st.local.v2.u32 [%rd2+144], {%r13482, %r237}; | |
mov.u32 %r11769, %r13482; | |
mov.u32 %r13482, %r237; | |
mov.u32 %r13481, %r11769; | |
BB12_78: | |
mov.u32 %r13477, %r13481; | |
mov.u32 %r13478, %r13482; | |
bfe.u32 %r5533, %r236, 22, 6; | |
mul.lo.s64 %rd731, %rd37, 1792; | |
add.s64 %rd732, %rd415, %rd731; | |
mul.wide.u32 %rd733, %r5533, 28; | |
add.s64 %rd734, %rd732, %rd733; | |
ld.global.u32 %r5534, [%rd734]; | |
and.b32 %r5535, %r5534, 65535; | |
bfe.u32 %r5536, %r5534, 16, 6; | |
mul.wide.u32 %rd735, %r5535, 1792; | |
add.s64 %rd736, %rd414, %rd735; | |
mul.wide.u32 %rd737, %r5536, 28; | |
add.s64 %rd738, %rd736, %rd737; | |
ld.global.u32 %r5537, [%rd738]; | |
and.b32 %r5538, %r5537, 65535; | |
shl.b32 %r5539, %r5538, 6; | |
bfe.u32 %r5540, %r5537, 16, 6; | |
or.b32 %r241, %r5539, %r5540; | |
st.local.u32 [%rd2+152], %r241; | |
bfe.u32 %r5541, %r5534, 22, 6; | |
mul.wide.u32 %rd739, %r5541, 28; | |
add.s64 %rd740, %rd736, %rd739; | |
ld.global.u32 %r5542, [%rd740]; | |
and.b32 %r5543, %r5542, 65535; | |
shl.b32 %r5544, %r5543, 6; | |
bfe.u32 %r5545, %r5542, 16, 6; | |
or.b32 %r13484, %r5544, %r5545; | |
st.local.u32 [%rd2+156], %r13484; | |
setp.le.u32 %p42, %r241, %r13484; | |
mov.u32 %r13483, %r241; | |
@%p42 bra BB12_80; | |
st.local.v2.u32 [%rd2+152], {%r13484, %r241}; | |
mov.u32 %r11775, %r13484; | |
mov.u32 %r13484, %r241; | |
mov.u32 %r13483, %r11775; | |
BB12_80: | |
mov.u32 %r244, %r13483; | |
mov.u32 %r243, %r13484; | |
setp.le.u32 %p43, %r13477, %r244; | |
mov.u32 %r13479, %r244; | |
mov.u32 %r13480, %r243; | |
@%p43 bra BB12_82; | |
st.local.v4.u32 [%rd2+144], {%r244, %r243, %r13477, %r13478}; | |
mov.u32 %r11772, %r13478; | |
mov.u32 %r11774, %r13477; | |
mov.u32 %r13478, %r243; | |
mov.u32 %r13477, %r244; | |
mov.u32 %r13479, %r11774; | |
mov.u32 %r13480, %r11772; | |
BB12_82: | |
mov.u32 %r248, %r13477; | |
mov.u32 %r247, %r13478; | |
mov.u32 %r246, %r13479; | |
mov.u32 %r245, %r13480; | |
setp.le.u32 %p44, %r13461, %r248; | |
mov.u32 %r13465, %r248; | |
mov.u32 %r13466, %r247; | |
mov.u32 %r13467, %r246; | |
mov.u32 %r13468, %r245; | |
@%p44 bra BB12_84; | |
st.local.v4.u32 [%rd2+128], {%r248, %r247, %r246, %r245}; | |
st.local.v4.u32 [%rd2+144], {%r13461, %r13462, %r13463, %r13464}; | |
mov.u32 %r11762, %r13464; | |
mov.u32 %r11764, %r13463; | |
mov.u32 %r11766, %r13462; | |
mov.u32 %r11768, %r13461; | |
mov.u32 %r13464, %r245; | |
mov.u32 %r13463, %r246; | |
mov.u32 %r13462, %r247; | |
mov.u32 %r13461, %r248; | |
mov.u32 %r13465, %r11768; | |
mov.u32 %r13466, %r11766; | |
mov.u32 %r13467, %r11764; | |
mov.u32 %r13468, %r11762; | |
BB12_84: | |
mov.u32 %r13445, %r13461; | |
mov.u32 %r13446, %r13462; | |
mov.u32 %r13447, %r13463; | |
mov.u32 %r13448, %r13464; | |
mov.u32 %r13449, %r13465; | |
mov.u32 %r13450, %r13466; | |
mov.u32 %r13451, %r13467; | |
mov.u32 %r13452, %r13468; | |
mul.lo.s64 %rd741, %rd34, 1792; | |
add.s64 %rd742, %rd6, %rd741; | |
bfe.u32 %r5546, %r221, 22, 6; | |
mul.wide.u32 %rd743, %r5546, 28; | |
add.s64 %rd744, %rd742, %rd743; | |
ld.global.u32 %r257, [%rd744+-8]; | |
and.b32 %r5547, %r257, 65535; | |
mul.wide.u32 %rd745, %r5547, 1792; | |
add.s64 %rd746, %rd4, %rd745; | |
cvt.u64.u32 %rd38, %r5547; | |
bfe.u32 %r5548, %r257, 16, 6; | |
mul.wide.u32 %rd747, %r5548, 28; | |
add.s64 %rd748, %rd746, %rd747; | |
ld.global.u32 %r258, [%rd748+-12]; | |
and.b32 %r5549, %r258, 65535; | |
cvt.u64.u32 %rd39, %r5549; | |
bfe.u32 %r5550, %r258, 16, 6; | |
mul.wide.u32 %rd749, %r5549, 1792; | |
add.s64 %rd750, %rd415, %rd749; | |
mul.wide.u32 %rd751, %r5550, 28; | |
add.s64 %rd752, %rd750, %rd751; | |
ld.global.u32 %r5551, [%rd752]; | |
and.b32 %r5552, %r5551, 65535; | |
bfe.u32 %r5553, %r5551, 16, 6; | |
mul.wide.u32 %rd753, %r5552, 1792; | |
add.s64 %rd754, %rd414, %rd753; | |
mul.wide.u32 %rd755, %r5553, 28; | |
add.s64 %rd756, %rd754, %rd755; | |
ld.global.u32 %r5554, [%rd756]; | |
and.b32 %r5555, %r5554, 65535; | |
shl.b32 %r5556, %r5555, 6; | |
bfe.u32 %r5557, %r5554, 16, 6; | |
or.b32 %r259, %r5556, %r5557; | |
st.local.u32 [%rd2+160], %r259; | |
bfe.u32 %r5558, %r5551, 22, 6; | |
mul.wide.u32 %rd757, %r5558, 28; | |
add.s64 %rd758, %rd754, %rd757; | |
ld.global.u32 %r5559, [%rd758]; | |
and.b32 %r5560, %r5559, 65535; | |
shl.b32 %r5561, %r5560, 6; | |
bfe.u32 %r5562, %r5559, 16, 6; | |
or.b32 %r13498, %r5561, %r5562; | |
st.local.u32 [%rd2+164], %r13498; | |
setp.le.u32 %p45, %r259, %r13498; | |
mov.u32 %r13497, %r259; | |
@%p45 bra BB12_86; | |
st.local.v2.u32 [%rd2+160], {%r13498, %r259}; | |
mov.u32 %r11805, %r13498; | |
mov.u32 %r13498, %r259; | |
mov.u32 %r13497, %r11805; | |
BB12_86: | |
mov.u32 %r13493, %r13497; | |
mov.u32 %r13494, %r13498; | |
bfe.u32 %r5563, %r258, 22, 6; | |
mul.lo.s64 %rd759, %rd39, 1792; | |
add.s64 %rd760, %rd415, %rd759; | |
mul.wide.u32 %rd761, %r5563, 28; | |
add.s64 %rd762, %rd760, %rd761; | |
ld.global.u32 %r5564, [%rd762]; | |
and.b32 %r5565, %r5564, 65535; | |
bfe.u32 %r5566, %r5564, 16, 6; | |
mul.wide.u32 %rd763, %r5565, 1792; | |
add.s64 %rd764, %rd414, %rd763; | |
mul.wide.u32 %rd765, %r5566, 28; | |
add.s64 %rd766, %rd764, %rd765; | |
ld.global.u32 %r5567, [%rd766]; | |
and.b32 %r5568, %r5567, 65535; | |
shl.b32 %r5569, %r5568, 6; | |
bfe.u32 %r5570, %r5567, 16, 6; | |
or.b32 %r263, %r5569, %r5570; | |
st.local.u32 [%rd2+168], %r263; | |
bfe.u32 %r5571, %r5564, 22, 6; | |
mul.wide.u32 %rd767, %r5571, 28; | |
add.s64 %rd768, %rd764, %rd767; | |
ld.global.u32 %r5572, [%rd768]; | |
and.b32 %r5573, %r5572, 65535; | |
shl.b32 %r5574, %r5573, 6; | |
bfe.u32 %r5575, %r5572, 16, 6; | |
or.b32 %r13500, %r5574, %r5575; | |
st.local.u32 [%rd2+172], %r13500; | |
setp.le.u32 %p46, %r263, %r13500; | |
mov.u32 %r13499, %r263; | |
@%p46 bra BB12_88; | |
st.local.v2.u32 [%rd2+168], {%r13500, %r263}; | |
mov.u32 %r11811, %r13500; | |
mov.u32 %r13500, %r263; | |
mov.u32 %r13499, %r11811; | |
BB12_88: | |
mov.u32 %r266, %r13499; | |
mov.u32 %r265, %r13500; | |
setp.le.u32 %p47, %r13493, %r266; | |
mov.u32 %r13495, %r266; | |
mov.u32 %r13496, %r265; | |
@%p47 bra BB12_90; | |
st.local.v4.u32 [%rd2+160], {%r266, %r265, %r13493, %r13494}; | |
mov.u32 %r11808, %r13494; | |
mov.u32 %r11810, %r13493; | |
mov.u32 %r13494, %r265; | |
mov.u32 %r13493, %r266; | |
mov.u32 %r13495, %r11810; | |
mov.u32 %r13496, %r11808; | |
BB12_90: | |
mov.u32 %r13485, %r13493; | |
mov.u32 %r13486, %r13494; | |
mov.u32 %r13487, %r13495; | |
mov.u32 %r13488, %r13496; | |
mul.lo.s64 %rd769, %rd38, 1792; | |
add.s64 %rd770, %rd4, %rd769; | |
bfe.u32 %r5576, %r257, 22, 6; | |
mul.wide.u32 %rd771, %r5576, 28; | |
add.s64 %rd772, %rd770, %rd771; | |
ld.global.u32 %r271, [%rd772+-12]; | |
and.b32 %r5577, %r271, 65535; | |
cvt.u64.u32 %rd40, %r5577; | |
bfe.u32 %r5578, %r271, 16, 6; | |
mul.wide.u32 %rd773, %r5577, 1792; | |
add.s64 %rd774, %rd415, %rd773; | |
mul.wide.u32 %rd775, %r5578, 28; | |
add.s64 %rd776, %rd774, %rd775; | |
ld.global.u32 %r5579, [%rd776]; | |
and.b32 %r5580, %r5579, 65535; | |
bfe.u32 %r5581, %r5579, 16, 6; | |
mul.wide.u32 %rd777, %r5580, 1792; | |
add.s64 %rd778, %rd414, %rd777; | |
mul.wide.u32 %rd779, %r5581, 28; | |
add.s64 %rd780, %rd778, %rd779; | |
ld.global.u32 %r5582, [%rd780]; | |
and.b32 %r5583, %r5582, 65535; | |
shl.b32 %r5584, %r5583, 6; | |
bfe.u32 %r5585, %r5582, 16, 6; | |
or.b32 %r272, %r5584, %r5585; | |
st.local.u32 [%rd2+176], %r272; | |
bfe.u32 %r5586, %r5579, 22, 6; | |
mul.wide.u32 %rd781, %r5586, 28; | |
add.s64 %rd782, %rd778, %rd781; | |
ld.global.u32 %r5587, [%rd782]; | |
and.b32 %r5588, %r5587, 65535; | |
shl.b32 %r5589, %r5588, 6; | |
bfe.u32 %r5590, %r5587, 16, 6; | |
or.b32 %r13506, %r5589, %r5590; | |
st.local.u32 [%rd2+180], %r13506; | |
setp.le.u32 %p48, %r272, %r13506; | |
mov.u32 %r13505, %r272; | |
@%p48 bra BB12_92; | |
st.local.v2.u32 [%rd2+176], {%r13506, %r272}; | |
mov.u32 %r11825, %r13506; | |
mov.u32 %r13506, %r272; | |
mov.u32 %r13505, %r11825; | |
BB12_92: | |
mov.u32 %r13501, %r13505; | |
mov.u32 %r13502, %r13506; | |
bfe.u32 %r5591, %r271, 22, 6; | |
mul.lo.s64 %rd783, %rd40, 1792; | |
add.s64 %rd784, %rd415, %rd783; | |
mul.wide.u32 %rd785, %r5591, 28; | |
add.s64 %rd786, %rd784, %rd785; | |
ld.global.u32 %r5592, [%rd786]; | |
and.b32 %r5593, %r5592, 65535; | |
bfe.u32 %r5594, %r5592, 16, 6; | |
mul.wide.u32 %rd787, %r5593, 1792; | |
add.s64 %rd788, %rd414, %rd787; | |
mul.wide.u32 %rd789, %r5594, 28; | |
add.s64 %rd790, %rd788, %rd789; | |
ld.global.u32 %r5595, [%rd790]; | |
and.b32 %r5596, %r5595, 65535; | |
shl.b32 %r5597, %r5596, 6; | |
bfe.u32 %r5598, %r5595, 16, 6; | |
or.b32 %r276, %r5597, %r5598; | |
st.local.u32 [%rd2+184], %r276; | |
bfe.u32 %r5599, %r5592, 22, 6; | |
mul.wide.u32 %rd791, %r5599, 28; | |
add.s64 %rd792, %rd788, %rd791; | |
ld.global.u32 %r5600, [%rd792]; | |
and.b32 %r5601, %r5600, 65535; | |
shl.b32 %r5602, %r5601, 6; | |
bfe.u32 %r5603, %r5600, 16, 6; | |
or.b32 %r13508, %r5602, %r5603; | |
st.local.u32 [%rd2+188], %r13508; | |
setp.le.u32 %p49, %r276, %r13508; | |
mov.u32 %r13507, %r276; | |
@%p49 bra BB12_94; | |
st.local.v2.u32 [%rd2+184], {%r13508, %r276}; | |
mov.u32 %r11831, %r13508; | |
mov.u32 %r13508, %r276; | |
mov.u32 %r13507, %r11831; | |
BB12_94: | |
mov.u32 %r279, %r13507; | |
mov.u32 %r278, %r13508; | |
setp.le.u32 %p50, %r13501, %r279; | |
mov.u32 %r13503, %r279; | |
mov.u32 %r13504, %r278; | |
@%p50 bra BB12_96; | |
st.local.v4.u32 [%rd2+176], {%r279, %r278, %r13501, %r13502}; | |
mov.u32 %r11828, %r13502; | |
mov.u32 %r11830, %r13501; | |
mov.u32 %r13502, %r278; | |
mov.u32 %r13501, %r279; | |
mov.u32 %r13503, %r11830; | |
mov.u32 %r13504, %r11828; | |
BB12_96: | |
mov.u32 %r283, %r13501; | |
mov.u32 %r282, %r13502; | |
mov.u32 %r281, %r13503; | |
mov.u32 %r280, %r13504; | |
setp.le.u32 %p51, %r13485, %r283; | |
mov.u32 %r13489, %r283; | |
mov.u32 %r13490, %r282; | |
mov.u32 %r13491, %r281; | |
mov.u32 %r13492, %r280; | |
@%p51 bra BB12_98; | |
st.local.v4.u32 [%rd2+160], {%r283, %r282, %r281, %r280}; | |
st.local.v4.u32 [%rd2+176], {%r13485, %r13486, %r13487, %r13488}; | |
mov.u32 %r11818, %r13488; | |
mov.u32 %r11820, %r13487; | |
mov.u32 %r11822, %r13486; | |
mov.u32 %r11824, %r13485; | |
mov.u32 %r13488, %r280; | |
mov.u32 %r13487, %r281; | |
mov.u32 %r13486, %r282; | |
mov.u32 %r13485, %r283; | |
mov.u32 %r13489, %r11824; | |
mov.u32 %r13490, %r11822; | |
mov.u32 %r13491, %r11820; | |
mov.u32 %r13492, %r11818; | |
BB12_98: | |
mov.u32 %r291, %r13485; | |
mov.u32 %r290, %r13486; | |
mov.u32 %r289, %r13487; | |
mov.u32 %r288, %r13488; | |
mov.u32 %r287, %r13489; | |
mov.u32 %r286, %r13490; | |
mov.u32 %r285, %r13491; | |
mov.u32 %r284, %r13492; | |
setp.le.u32 %p52, %r13445, %r291; | |
mov.u32 %r13453, %r291; | |
mov.u32 %r13454, %r290; | |
mov.u32 %r13455, %r289; | |
mov.u32 %r13456, %r288; | |
mov.u32 %r13457, %r287; | |
mov.u32 %r13458, %r286; | |
mov.u32 %r13459, %r285; | |
mov.u32 %r13460, %r284; | |
@%p52 bra BB12_100; | |
st.local.v4.u32 [%rd2+128], {%r291, %r290, %r289, %r288}; | |
st.local.v4.u32 [%rd2+160], {%r13445, %r13446, %r13447, %r13448}; | |
st.local.v4.u32 [%rd2+144], {%r287, %r286, %r285, %r284}; | |
st.local.v4.u32 [%rd2+176], {%r13449, %r13450, %r13451, %r13452}; | |
mov.u32 %r11790, %r13452; | |
mov.u32 %r11792, %r13451; | |
mov.u32 %r11794, %r13450; | |
mov.u32 %r11796, %r13449; | |
mov.u32 %r11798, %r13448; | |
mov.u32 %r11800, %r13447; | |
mov.u32 %r11802, %r13446; | |
mov.u32 %r11804, %r13445; | |
mov.u32 %r13452, %r284; | |
mov.u32 %r13451, %r285; | |
mov.u32 %r13450, %r286; | |
mov.u32 %r13449, %r287; | |
mov.u32 %r13448, %r288; | |
mov.u32 %r13447, %r289; | |
mov.u32 %r13446, %r290; | |
mov.u32 %r13445, %r291; | |
mov.u32 %r13453, %r11804; | |
mov.u32 %r13454, %r11802; | |
mov.u32 %r13455, %r11800; | |
mov.u32 %r13456, %r11798; | |
mov.u32 %r13457, %r11796; | |
mov.u32 %r13458, %r11794; | |
mov.u32 %r13459, %r11792; | |
mov.u32 %r13460, %r11790; | |
BB12_100: | |
mov.u32 %r13413, %r13445; | |
mov.u32 %r13414, %r13446; | |
mov.u32 %r13415, %r13447; | |
mov.u32 %r13416, %r13448; | |
mov.u32 %r13417, %r13449; | |
mov.u32 %r13418, %r13450; | |
mov.u32 %r13419, %r13451; | |
mov.u32 %r13420, %r13452; | |
mov.u32 %r13421, %r13453; | |
mov.u32 %r13422, %r13454; | |
mov.u32 %r13423, %r13455; | |
mov.u32 %r13424, %r13456; | |
mov.u32 %r13425, %r13457; | |
mov.u32 %r13426, %r13458; | |
mov.u32 %r13427, %r13459; | |
mov.u32 %r13428, %r13460; | |
mul.lo.s64 %rd793, %rd33, 1792; | |
add.s64 %rd794, %rd4, %rd793; | |
bfe.u32 %r5604, %r220, 22, 6; | |
mul.wide.u32 %rd795, %r5604, 28; | |
add.s64 %rd796, %rd794, %rd795; | |
ld.global.u32 %r308, [%rd796+-8]; | |
and.b32 %r5605, %r308, 65535; | |
mul.wide.u32 %rd797, %r5605, 1792; | |
add.s64 %rd798, %rd6, %rd797; | |
bfe.u32 %r5606, %r308, 16, 6; | |
mul.wide.u32 %rd799, %r5606, 28; | |
add.s64 %rd800, %rd798, %rd799; | |
ld.global.u32 %r309, [%rd800+-8]; | |
and.b32 %r5607, %r309, 65535; | |
mul.wide.u32 %rd801, %r5607, 1792; | |
add.s64 %rd802, %rd4, %rd801; | |
cvt.u64.u32 %rd41, %r5605; | |
cvt.u64.u32 %rd42, %r5607; | |
bfe.u32 %r5608, %r309, 16, 6; | |
mul.wide.u32 %rd803, %r5608, 28; | |
add.s64 %rd804, %rd802, %rd803; | |
ld.global.u32 %r310, [%rd804+-12]; | |
and.b32 %r5609, %r310, 65535; | |
cvt.u64.u32 %rd43, %r5609; | |
bfe.u32 %r5610, %r310, 16, 6; | |
mul.wide.u32 %rd805, %r5609, 1792; | |
add.s64 %rd806, %rd415, %rd805; | |
mul.wide.u32 %rd807, %r5610, 28; | |
add.s64 %rd808, %rd806, %rd807; | |
ld.global.u32 %r5611, [%rd808]; | |
and.b32 %r5612, %r5611, 65535; | |
bfe.u32 %r5613, %r5611, 16, 6; | |
mul.wide.u32 %rd809, %r5612, 1792; | |
add.s64 %rd810, %rd414, %rd809; | |
mul.wide.u32 %rd811, %r5613, 28; | |
add.s64 %rd812, %rd810, %rd811; | |
ld.global.u32 %r5614, [%rd812]; | |
and.b32 %r5615, %r5614, 65535; | |
shl.b32 %r5616, %r5615, 6; | |
bfe.u32 %r5617, %r5614, 16, 6; | |
or.b32 %r311, %r5616, %r5617; | |
st.local.u32 [%rd2+192], %r311; | |
bfe.u32 %r5618, %r5611, 22, 6; | |
mul.wide.u32 %rd813, %r5618, 28; | |
add.s64 %rd814, %rd810, %rd813; | |
ld.global.u32 %r5619, [%rd814]; | |
and.b32 %r5620, %r5619, 65535; | |
shl.b32 %r5621, %r5620, 6; | |
bfe.u32 %r5622, %r5619, 16, 6; | |
or.b32 %r13538, %r5621, %r5622; | |
st.local.u32 [%rd2+196], %r13538; | |
setp.le.u32 %p53, %r311, %r13538; | |
mov.u32 %r13537, %r311; | |
@%p53 bra BB12_102; | |
st.local.v2.u32 [%rd2+192], {%r13538, %r311}; | |
mov.u32 %r11893, %r13538; | |
mov.u32 %r13538, %r311; | |
mov.u32 %r13537, %r11893; | |
BB12_102: | |
mov.u32 %r13533, %r13537; | |
mov.u32 %r13534, %r13538; | |
bfe.u32 %r5623, %r310, 22, 6; | |
mul.lo.s64 %rd815, %rd43, 1792; | |
add.s64 %rd816, %rd415, %rd815; | |
mul.wide.u32 %rd817, %r5623, 28; | |
add.s64 %rd818, %rd816, %rd817; | |
ld.global.u32 %r5624, [%rd818]; | |
and.b32 %r5625, %r5624, 65535; | |
bfe.u32 %r5626, %r5624, 16, 6; | |
mul.wide.u32 %rd819, %r5625, 1792; | |
add.s64 %rd820, %rd414, %rd819; | |
mul.wide.u32 %rd821, %r5626, 28; | |
add.s64 %rd822, %rd820, %rd821; | |
ld.global.u32 %r5627, [%rd822]; | |
and.b32 %r5628, %r5627, 65535; | |
shl.b32 %r5629, %r5628, 6; | |
bfe.u32 %r5630, %r5627, 16, 6; | |
or.b32 %r315, %r5629, %r5630; | |
st.local.u32 [%rd2+200], %r315; | |
bfe.u32 %r5631, %r5624, 22, 6; | |
mul.wide.u32 %rd823, %r5631, 28; | |
add.s64 %rd824, %rd820, %rd823; | |
ld.global.u32 %r5632, [%rd824]; | |
and.b32 %r5633, %r5632, 65535; | |
shl.b32 %r5634, %r5633, 6; | |
bfe.u32 %r5635, %r5632, 16, 6; | |
or.b32 %r13540, %r5634, %r5635; | |
st.local.u32 [%rd2+204], %r13540; | |
setp.le.u32 %p54, %r315, %r13540; | |
mov.u32 %r13539, %r315; | |
@%p54 bra BB12_104; | |
st.local.v2.u32 [%rd2+200], {%r13540, %r315}; | |
mov.u32 %r11899, %r13540; | |
mov.u32 %r13540, %r315; | |
mov.u32 %r13539, %r11899; | |
BB12_104: | |
mov.u32 %r318, %r13539; | |
mov.u32 %r317, %r13540; | |
setp.le.u32 %p55, %r13533, %r318; | |
mov.u32 %r13535, %r318; | |
mov.u32 %r13536, %r317; | |
@%p55 bra BB12_106; | |
st.local.v4.u32 [%rd2+192], {%r318, %r317, %r13533, %r13534}; | |
mov.u32 %r11896, %r13534; | |
mov.u32 %r11898, %r13533; | |
mov.u32 %r13534, %r317; | |
mov.u32 %r13533, %r318; | |
mov.u32 %r13535, %r11898; | |
mov.u32 %r13536, %r11896; | |
BB12_106: | |
mov.u32 %r13525, %r13533; | |
mov.u32 %r13526, %r13534; | |
mov.u32 %r13527, %r13535; | |
mov.u32 %r13528, %r13536; | |
mul.lo.s64 %rd825, %rd42, 1792; | |
add.s64 %rd826, %rd4, %rd825; | |
bfe.u32 %r5636, %r309, 22, 6; | |
mul.wide.u32 %rd827, %r5636, 28; | |
add.s64 %rd828, %rd826, %rd827; | |
ld.global.u32 %r323, [%rd828+-12]; | |
and.b32 %r5637, %r323, 65535; | |
cvt.u64.u32 %rd44, %r5637; | |
bfe.u32 %r5638, %r323, 16, 6; | |
mul.wide.u32 %rd829, %r5637, 1792; | |
add.s64 %rd830, %rd415, %rd829; | |
mul.wide.u32 %rd831, %r5638, 28; | |
add.s64 %rd832, %rd830, %rd831; | |
ld.global.u32 %r5639, [%rd832]; | |
and.b32 %r5640, %r5639, 65535; | |
bfe.u32 %r5641, %r5639, 16, 6; | |
mul.wide.u32 %rd833, %r5640, 1792; | |
add.s64 %rd834, %rd414, %rd833; | |
mul.wide.u32 %rd835, %r5641, 28; | |
add.s64 %rd836, %rd834, %rd835; | |
ld.global.u32 %r5642, [%rd836]; | |
and.b32 %r5643, %r5642, 65535; | |
shl.b32 %r5644, %r5643, 6; | |
bfe.u32 %r5645, %r5642, 16, 6; | |
or.b32 %r324, %r5644, %r5645; | |
st.local.u32 [%rd2+208], %r324; | |
bfe.u32 %r5646, %r5639, 22, 6; | |
mul.wide.u32 %rd837, %r5646, 28; | |
add.s64 %rd838, %rd834, %rd837; | |
ld.global.u32 %r5647, [%rd838]; | |
and.b32 %r5648, %r5647, 65535; | |
shl.b32 %r5649, %r5648, 6; | |
bfe.u32 %r5650, %r5647, 16, 6; | |
or.b32 %r13546, %r5649, %r5650; | |
st.local.u32 [%rd2+212], %r13546; | |
setp.le.u32 %p56, %r324, %r13546; | |
mov.u32 %r13545, %r324; | |
@%p56 bra BB12_108; | |
st.local.v2.u32 [%rd2+208], {%r13546, %r324}; | |
mov.u32 %r11913, %r13546; | |
mov.u32 %r13546, %r324; | |
mov.u32 %r13545, %r11913; | |
BB12_108: | |
mov.u32 %r13541, %r13545; | |
mov.u32 %r13542, %r13546; | |
bfe.u32 %r5651, %r323, 22, 6; | |
mul.lo.s64 %rd839, %rd44, 1792; | |
add.s64 %rd840, %rd415, %rd839; | |
mul.wide.u32 %rd841, %r5651, 28; | |
add.s64 %rd842, %rd840, %rd841; | |
ld.global.u32 %r5652, [%rd842]; | |
and.b32 %r5653, %r5652, 65535; | |
bfe.u32 %r5654, %r5652, 16, 6; | |
mul.wide.u32 %rd843, %r5653, 1792; | |
add.s64 %rd844, %rd414, %rd843; | |
mul.wide.u32 %rd845, %r5654, 28; | |
add.s64 %rd846, %rd844, %rd845; | |
ld.global.u32 %r5655, [%rd846]; | |
and.b32 %r5656, %r5655, 65535; | |
shl.b32 %r5657, %r5656, 6; | |
bfe.u32 %r5658, %r5655, 16, 6; | |
or.b32 %r328, %r5657, %r5658; | |
st.local.u32 [%rd2+216], %r328; | |
bfe.u32 %r5659, %r5652, 22, 6; | |
mul.wide.u32 %rd847, %r5659, 28; | |
add.s64 %rd848, %rd844, %rd847; | |
ld.global.u32 %r5660, [%rd848]; | |
and.b32 %r5661, %r5660, 65535; | |
shl.b32 %r5662, %r5661, 6; | |
bfe.u32 %r5663, %r5660, 16, 6; | |
or.b32 %r13548, %r5662, %r5663; | |
st.local.u32 [%rd2+220], %r13548; | |
setp.le.u32 %p57, %r328, %r13548; | |
mov.u32 %r13547, %r328; | |
@%p57 bra BB12_110; | |
st.local.v2.u32 [%rd2+216], {%r13548, %r328}; | |
mov.u32 %r11919, %r13548; | |
mov.u32 %r13548, %r328; | |
mov.u32 %r13547, %r11919; | |
BB12_110: | |
mov.u32 %r331, %r13547; | |
mov.u32 %r330, %r13548; | |
setp.le.u32 %p58, %r13541, %r331; | |
mov.u32 %r13543, %r331; | |
mov.u32 %r13544, %r330; | |
@%p58 bra BB12_112; | |
st.local.v4.u32 [%rd2+208], {%r331, %r330, %r13541, %r13542}; | |
mov.u32 %r11916, %r13542; | |
mov.u32 %r11918, %r13541; | |
mov.u32 %r13542, %r330; | |
mov.u32 %r13541, %r331; | |
mov.u32 %r13543, %r11918; | |
mov.u32 %r13544, %r11916; | |
BB12_112: | |
mov.u32 %r335, %r13541; | |
mov.u32 %r334, %r13542; | |
mov.u32 %r333, %r13543; | |
mov.u32 %r332, %r13544; | |
setp.le.u32 %p59, %r13525, %r335; | |
mov.u32 %r13529, %r335; | |
mov.u32 %r13530, %r334; | |
mov.u32 %r13531, %r333; | |
mov.u32 %r13532, %r332; | |
@%p59 bra BB12_114; | |
st.local.v4.u32 [%rd2+192], {%r335, %r334, %r333, %r332}; | |
st.local.v4.u32 [%rd2+208], {%r13525, %r13526, %r13527, %r13528}; | |
mov.u32 %r11906, %r13528; | |
mov.u32 %r11908, %r13527; | |
mov.u32 %r11910, %r13526; | |
mov.u32 %r11912, %r13525; | |
mov.u32 %r13528, %r332; | |
mov.u32 %r13527, %r333; | |
mov.u32 %r13526, %r334; | |
mov.u32 %r13525, %r335; | |
mov.u32 %r13529, %r11912; | |
mov.u32 %r13530, %r11910; | |
mov.u32 %r13531, %r11908; | |
mov.u32 %r13532, %r11906; | |
BB12_114: | |
mov.u32 %r13509, %r13525; | |
mov.u32 %r13510, %r13526; | |
mov.u32 %r13511, %r13527; | |
mov.u32 %r13512, %r13528; | |
mov.u32 %r13513, %r13529; | |
mov.u32 %r13514, %r13530; | |
mov.u32 %r13515, %r13531; | |
mov.u32 %r13516, %r13532; | |
mul.lo.s64 %rd849, %rd41, 1792; | |
add.s64 %rd850, %rd6, %rd849; | |
bfe.u32 %r5664, %r308, 22, 6; | |
mul.wide.u32 %rd851, %r5664, 28; | |
add.s64 %rd852, %rd850, %rd851; | |
ld.global.u32 %r344, [%rd852+-8]; | |
and.b32 %r5665, %r344, 65535; | |
mul.wide.u32 %rd853, %r5665, 1792; | |
add.s64 %rd854, %rd4, %rd853; | |
cvt.u64.u32 %rd45, %r5665; | |
bfe.u32 %r5666, %r344, 16, 6; | |
mul.wide.u32 %rd855, %r5666, 28; | |
add.s64 %rd856, %rd854, %rd855; | |
ld.global.u32 %r345, [%rd856+-12]; | |
and.b32 %r5667, %r345, 65535; | |
cvt.u64.u32 %rd46, %r5667; | |
bfe.u32 %r5668, %r345, 16, 6; | |
mul.wide.u32 %rd857, %r5667, 1792; | |
add.s64 %rd858, %rd415, %rd857; | |
mul.wide.u32 %rd859, %r5668, 28; | |
add.s64 %rd860, %rd858, %rd859; | |
ld.global.u32 %r5669, [%rd860]; | |
and.b32 %r5670, %r5669, 65535; | |
bfe.u32 %r5671, %r5669, 16, 6; | |
mul.wide.u32 %rd861, %r5670, 1792; | |
add.s64 %rd862, %rd414, %rd861; | |
mul.wide.u32 %rd863, %r5671, 28; | |
add.s64 %rd864, %rd862, %rd863; | |
ld.global.u32 %r5672, [%rd864]; | |
and.b32 %r5673, %r5672, 65535; | |
shl.b32 %r5674, %r5673, 6; | |
bfe.u32 %r5675, %r5672, 16, 6; | |
or.b32 %r346, %r5674, %r5675; | |
st.local.u32 [%rd2+224], %r346; | |
bfe.u32 %r5676, %r5669, 22, 6; | |
mul.wide.u32 %rd865, %r5676, 28; | |
add.s64 %rd866, %rd862, %rd865; | |
ld.global.u32 %r5677, [%rd866]; | |
and.b32 %r5678, %r5677, 65535; | |
shl.b32 %r5679, %r5678, 6; | |
bfe.u32 %r5680, %r5677, 16, 6; | |
or.b32 %r13562, %r5679, %r5680; | |
st.local.u32 [%rd2+228], %r13562; | |
setp.le.u32 %p60, %r346, %r13562; | |
mov.u32 %r13561, %r346; | |
@%p60 bra BB12_116; | |
st.local.v2.u32 [%rd2+224], {%r13562, %r346}; | |
mov.u32 %r11949, %r13562; | |
mov.u32 %r13562, %r346; | |
mov.u32 %r13561, %r11949; | |
BB12_116: | |
mov.u32 %r13557, %r13561; | |
mov.u32 %r13558, %r13562; | |
bfe.u32 %r5681, %r345, 22, 6; | |
mul.lo.s64 %rd867, %rd46, 1792; | |
add.s64 %rd868, %rd415, %rd867; | |
mul.wide.u32 %rd869, %r5681, 28; | |
add.s64 %rd870, %rd868, %rd869; | |
ld.global.u32 %r5682, [%rd870]; | |
and.b32 %r5683, %r5682, 65535; | |
bfe.u32 %r5684, %r5682, 16, 6; | |
mul.wide.u32 %rd871, %r5683, 1792; | |
add.s64 %rd872, %rd414, %rd871; | |
mul.wide.u32 %rd873, %r5684, 28; | |
add.s64 %rd874, %rd872, %rd873; | |
ld.global.u32 %r5685, [%rd874]; | |
and.b32 %r5686, %r5685, 65535; | |
shl.b32 %r5687, %r5686, 6; | |
bfe.u32 %r5688, %r5685, 16, 6; | |
or.b32 %r350, %r5687, %r5688; | |
st.local.u32 [%rd2+232], %r350; | |
bfe.u32 %r5689, %r5682, 22, 6; | |
mul.wide.u32 %rd875, %r5689, 28; | |
add.s64 %rd876, %rd872, %rd875; | |
ld.global.u32 %r5690, [%rd876]; | |
and.b32 %r5691, %r5690, 65535; | |
shl.b32 %r5692, %r5691, 6; | |
bfe.u32 %r5693, %r5690, 16, 6; | |
or.b32 %r13564, %r5692, %r5693; | |
st.local.u32 [%rd2+236], %r13564; | |
setp.le.u32 %p61, %r350, %r13564; | |
mov.u32 %r13563, %r350; | |
@%p61 bra BB12_118; | |
st.local.v2.u32 [%rd2+232], {%r13564, %r350}; | |
mov.u32 %r11955, %r13564; | |
mov.u32 %r13564, %r350; | |
mov.u32 %r13563, %r11955; | |
BB12_118: | |
mov.u32 %r353, %r13563; | |
mov.u32 %r352, %r13564; | |
setp.le.u32 %p62, %r13557, %r353; | |
mov.u32 %r13559, %r353; | |
mov.u32 %r13560, %r352; | |
@%p62 bra BB12_120; | |
st.local.v4.u32 [%rd2+224], {%r353, %r352, %r13557, %r13558}; | |
mov.u32 %r11952, %r13558; | |
mov.u32 %r11954, %r13557; | |
mov.u32 %r13558, %r352; | |
mov.u32 %r13557, %r353; | |
mov.u32 %r13559, %r11954; | |
mov.u32 %r13560, %r11952; | |
BB12_120: | |
mov.u32 %r13549, %r13557; | |
mov.u32 %r13550, %r13558; | |
mov.u32 %r13551, %r13559; | |
mov.u32 %r13552, %r13560; | |
mul.lo.s64 %rd877, %rd45, 1792; | |
add.s64 %rd878, %rd4, %rd877; | |
bfe.u32 %r5694, %r344, 22, 6; | |
mul.wide.u32 %rd879, %r5694, 28; | |
add.s64 %rd880, %rd878, %rd879; | |
ld.global.u32 %r358, [%rd880+-12]; | |
and.b32 %r5695, %r358, 65535; | |
cvt.u64.u32 %rd47, %r5695; | |
bfe.u32 %r5696, %r358, 16, 6; | |
mul.wide.u32 %rd881, %r5695, 1792; | |
add.s64 %rd882, %rd415, %rd881; | |
mul.wide.u32 %rd883, %r5696, 28; | |
add.s64 %rd884, %rd882, %rd883; | |
ld.global.u32 %r5697, [%rd884]; | |
and.b32 %r5698, %r5697, 65535; | |
bfe.u32 %r5699, %r5697, 16, 6; | |
mul.wide.u32 %rd885, %r5698, 1792; | |
add.s64 %rd886, %rd414, %rd885; | |
mul.wide.u32 %rd887, %r5699, 28; | |
add.s64 %rd888, %rd886, %rd887; | |
ld.global.u32 %r5700, [%rd888]; | |
and.b32 %r5701, %r5700, 65535; | |
shl.b32 %r5702, %r5701, 6; | |
bfe.u32 %r5703, %r5700, 16, 6; | |
or.b32 %r359, %r5702, %r5703; | |
st.local.u32 [%rd2+240], %r359; | |
bfe.u32 %r5704, %r5697, 22, 6; | |
mul.wide.u32 %rd889, %r5704, 28; | |
add.s64 %rd890, %rd886, %rd889; | |
ld.global.u32 %r5705, [%rd890]; | |
and.b32 %r5706, %r5705, 65535; | |
shl.b32 %r5707, %r5706, 6; | |
bfe.u32 %r5708, %r5705, 16, 6; | |
or.b32 %r13570, %r5707, %r5708; | |
st.local.u32 [%rd2+244], %r13570; | |
setp.le.u32 %p63, %r359, %r13570; | |
mov.u32 %r13569, %r359; | |
@%p63 bra BB12_122; | |
st.local.v2.u32 [%rd2+240], {%r13570, %r359}; | |
mov.u32 %r11969, %r13570; | |
mov.u32 %r13570, %r359; | |
mov.u32 %r13569, %r11969; | |
BB12_122: | |
mov.u32 %r13565, %r13569; | |
mov.u32 %r13566, %r13570; | |
bfe.u32 %r5709, %r358, 22, 6; | |
mul.lo.s64 %rd891, %rd47, 1792; | |
add.s64 %rd892, %rd415, %rd891; | |
mul.wide.u32 %rd893, %r5709, 28; | |
add.s64 %rd894, %rd892, %rd893; | |
ld.global.u32 %r5710, [%rd894]; | |
and.b32 %r5711, %r5710, 65535; | |
bfe.u32 %r5712, %r5710, 16, 6; | |
mul.wide.u32 %rd895, %r5711, 1792; | |
add.s64 %rd896, %rd414, %rd895; | |
mul.wide.u32 %rd897, %r5712, 28; | |
add.s64 %rd898, %rd896, %rd897; | |
ld.global.u32 %r5713, [%rd898]; | |
and.b32 %r5714, %r5713, 65535; | |
shl.b32 %r5715, %r5714, 6; | |
bfe.u32 %r5716, %r5713, 16, 6; | |
or.b32 %r363, %r5715, %r5716; | |
st.local.u32 [%rd2+248], %r363; | |
bfe.u32 %r5717, %r5710, 22, 6; | |
mul.wide.u32 %rd899, %r5717, 28; | |
add.s64 %rd900, %rd896, %rd899; | |
ld.global.u32 %r5718, [%rd900]; | |
and.b32 %r5719, %r5718, 65535; | |
shl.b32 %r5720, %r5719, 6; | |
bfe.u32 %r5721, %r5718, 16, 6; | |
or.b32 %r13572, %r5720, %r5721; | |
st.local.u32 [%rd2+252], %r13572; | |
setp.le.u32 %p64, %r363, %r13572; | |
mov.u32 %r13571, %r363; | |
@%p64 bra BB12_124; | |
st.local.v2.u32 [%rd2+248], {%r13572, %r363}; | |
mov.u32 %r11975, %r13572; | |
mov.u32 %r13572, %r363; | |
mov.u32 %r13571, %r11975; | |
BB12_124: | |
mov.u32 %r366, %r13571; | |
mov.u32 %r365, %r13572; | |
setp.le.u32 %p65, %r13565, %r366; | |
mov.u32 %r13567, %r366; | |
mov.u32 %r13568, %r365; | |
@%p65 bra BB12_126; | |
st.local.v4.u32 [%rd2+240], {%r366, %r365, %r13565, %r13566}; | |
mov.u32 %r11972, %r13566; | |
mov.u32 %r11974, %r13565; | |
mov.u32 %r13566, %r365; | |
mov.u32 %r13565, %r366; | |
mov.u32 %r13567, %r11974; | |
mov.u32 %r13568, %r11972; | |
BB12_126: | |
mov.u32 %r370, %r13565; | |
mov.u32 %r369, %r13566; | |
mov.u32 %r368, %r13567; | |
mov.u32 %r367, %r13568; | |
setp.le.u32 %p66, %r13549, %r370; | |
mov.u32 %r13553, %r370; | |
mov.u32 %r13554, %r369; | |
mov.u32 %r13555, %r368; | |
mov.u32 %r13556, %r367; | |
@%p66 bra BB12_128; | |
st.local.v4.u32 [%rd2+224], {%r370, %r369, %r368, %r367}; | |
st.local.v4.u32 [%rd2+240], {%r13549, %r13550, %r13551, %r13552}; | |
mov.u32 %r11962, %r13552; | |
mov.u32 %r11964, %r13551; | |
mov.u32 %r11966, %r13550; | |
mov.u32 %r11968, %r13549; | |
mov.u32 %r13552, %r367; | |
mov.u32 %r13551, %r368; | |
mov.u32 %r13550, %r369; | |
mov.u32 %r13549, %r370; | |
mov.u32 %r13553, %r11968; | |
mov.u32 %r13554, %r11966; | |
mov.u32 %r13555, %r11964; | |
mov.u32 %r13556, %r11962; | |
BB12_128: | |
mov.u32 %r378, %r13549; | |
mov.u32 %r377, %r13550; | |
mov.u32 %r376, %r13551; | |
mov.u32 %r375, %r13552; | |
mov.u32 %r374, %r13553; | |
mov.u32 %r373, %r13554; | |
mov.u32 %r372, %r13555; | |
mov.u32 %r371, %r13556; | |
setp.le.u32 %p67, %r13509, %r378; | |
mov.u32 %r13517, %r378; | |
mov.u32 %r13518, %r377; | |
mov.u32 %r13519, %r376; | |
mov.u32 %r13520, %r375; | |
mov.u32 %r13521, %r374; | |
mov.u32 %r13522, %r373; | |
mov.u32 %r13523, %r372; | |
mov.u32 %r13524, %r371; | |
@%p67 bra BB12_130; | |
st.local.v4.u32 [%rd2+192], {%r378, %r377, %r376, %r375}; | |
st.local.v4.u32 [%rd2+224], {%r13509, %r13510, %r13511, %r13512}; | |
st.local.v4.u32 [%rd2+208], {%r374, %r373, %r372, %r371}; | |
st.local.v4.u32 [%rd2+240], {%r13513, %r13514, %r13515, %r13516}; | |
mov.u32 %r11934, %r13516; | |
mov.u32 %r11936, %r13515; | |
mov.u32 %r11938, %r13514; | |
mov.u32 %r11940, %r13513; | |
mov.u32 %r11942, %r13512; | |
mov.u32 %r11944, %r13511; | |
mov.u32 %r11946, %r13510; | |
mov.u32 %r11948, %r13509; | |
mov.u32 %r13516, %r371; | |
mov.u32 %r13515, %r372; | |
mov.u32 %r13514, %r373; | |
mov.u32 %r13513, %r374; | |
mov.u32 %r13512, %r375; | |
mov.u32 %r13511, %r376; | |
mov.u32 %r13510, %r377; | |
mov.u32 %r13509, %r378; | |
mov.u32 %r13517, %r11948; | |
mov.u32 %r13518, %r11946; | |
mov.u32 %r13519, %r11944; | |
mov.u32 %r13520, %r11942; | |
mov.u32 %r13521, %r11940; | |
mov.u32 %r13522, %r11938; | |
mov.u32 %r13523, %r11936; | |
mov.u32 %r13524, %r11934; | |
BB12_130: | |
mov.u32 %r394, %r13509; | |
mov.u32 %r393, %r13510; | |
mov.u32 %r392, %r13511; | |
mov.u32 %r391, %r13512; | |
mov.u32 %r390, %r13513; | |
mov.u32 %r389, %r13514; | |
mov.u32 %r388, %r13515; | |
mov.u32 %r387, %r13516; | |
mov.u32 %r386, %r13517; | |
mov.u32 %r385, %r13518; | |
mov.u32 %r384, %r13519; | |
mov.u32 %r383, %r13520; | |
mov.u32 %r382, %r13521; | |
mov.u32 %r381, %r13522; | |
mov.u32 %r380, %r13523; | |
mov.u32 %r379, %r13524; | |
setp.le.u32 %p68, %r13413, %r394; | |
mov.u32 %r13429, %r394; | |
mov.u32 %r13430, %r393; | |
mov.u32 %r13431, %r392; | |
mov.u32 %r13432, %r391; | |
mov.u32 %r13433, %r390; | |
mov.u32 %r13434, %r389; | |
mov.u32 %r13435, %r388; | |
mov.u32 %r13436, %r387; | |
mov.u32 %r13437, %r386; | |
mov.u32 %r13438, %r385; | |
mov.u32 %r13439, %r384; | |
mov.u32 %r13440, %r383; | |
mov.u32 %r13441, %r382; | |
mov.u32 %r13442, %r381; | |
mov.u32 %r13443, %r380; | |
mov.u32 %r13444, %r379; | |
@%p68 bra BB12_132; | |
st.local.v4.u32 [%rd2+128], {%r394, %r393, %r392, %r391}; | |
st.local.v4.u32 [%rd2+192], {%r13413, %r13414, %r13415, %r13416}; | |
st.local.v4.u32 [%rd2+144], {%r390, %r389, %r388, %r387}; | |
st.local.v4.u32 [%rd2+208], {%r13417, %r13418, %r13419, %r13420}; | |
st.local.v4.u32 [%rd2+160], {%r386, %r385, %r384, %r383}; | |
st.local.v4.u32 [%rd2+224], {%r13421, %r13422, %r13423, %r13424}; | |
st.local.v4.u32 [%rd2+176], {%r382, %r381, %r380, %r379}; | |
st.local.v4.u32 [%rd2+240], {%r13425, %r13426, %r13427, %r13428}; | |
mov.u32 %r11862, %r13428; | |
mov.u32 %r11864, %r13427; | |
mov.u32 %r11866, %r13426; | |
mov.u32 %r11868, %r13425; | |
mov.u32 %r11870, %r13424; | |
mov.u32 %r11872, %r13423; | |
mov.u32 %r11874, %r13422; | |
mov.u32 %r11876, %r13421; | |
mov.u32 %r11878, %r13420; | |
mov.u32 %r11880, %r13419; | |
mov.u32 %r11882, %r13418; | |
mov.u32 %r11884, %r13417; | |
mov.u32 %r11886, %r13416; | |
mov.u32 %r11888, %r13415; | |
mov.u32 %r11890, %r13414; | |
mov.u32 %r11892, %r13413; | |
mov.u32 %r13428, %r379; | |
mov.u32 %r13427, %r380; | |
mov.u32 %r13426, %r381; | |
mov.u32 %r13425, %r382; | |
mov.u32 %r13424, %r383; | |
mov.u32 %r13423, %r384; | |
mov.u32 %r13422, %r385; | |
mov.u32 %r13421, %r386; | |
mov.u32 %r13420, %r387; | |
mov.u32 %r13419, %r388; | |
mov.u32 %r13418, %r389; | |
mov.u32 %r13417, %r390; | |
mov.u32 %r13416, %r391; | |
mov.u32 %r13415, %r392; | |
mov.u32 %r13414, %r393; | |
mov.u32 %r13413, %r394; | |
mov.u32 %r13429, %r11892; | |
mov.u32 %r13430, %r11890; | |
mov.u32 %r13431, %r11888; | |
mov.u32 %r13432, %r11886; | |
mov.u32 %r13433, %r11884; | |
mov.u32 %r13434, %r11882; | |
mov.u32 %r13435, %r11880; | |
mov.u32 %r13436, %r11878; | |
mov.u32 %r13437, %r11876; | |
mov.u32 %r13438, %r11874; | |
mov.u32 %r13439, %r11872; | |
mov.u32 %r13440, %r11870; | |
mov.u32 %r13441, %r11868; | |
mov.u32 %r13442, %r11866; | |
mov.u32 %r13443, %r11864; | |
mov.u32 %r13444, %r11862; | |
BB12_132: | |
mov.u32 %r426, %r13413; | |
mov.u32 %r425, %r13414; | |
mov.u32 %r424, %r13415; | |
mov.u32 %r423, %r13416; | |
mov.u32 %r422, %r13417; | |
mov.u32 %r421, %r13418; | |
mov.u32 %r420, %r13419; | |
mov.u32 %r419, %r13420; | |
mov.u32 %r418, %r13421; | |
mov.u32 %r417, %r13422; | |
mov.u32 %r416, %r13423; | |
mov.u32 %r415, %r13424; | |
mov.u32 %r414, %r13425; | |
mov.u32 %r413, %r13426; | |
mov.u32 %r412, %r13427; | |
mov.u32 %r411, %r13428; | |
mov.u32 %r410, %r13429; | |
mov.u32 %r409, %r13430; | |
mov.u32 %r408, %r13431; | |
mov.u32 %r407, %r13432; | |
mov.u32 %r406, %r13433; | |
mov.u32 %r405, %r13434; | |
mov.u32 %r404, %r13435; | |
mov.u32 %r403, %r13436; | |
mov.u32 %r402, %r13437; | |
mov.u32 %r401, %r13438; | |
mov.u32 %r400, %r13439; | |
mov.u32 %r399, %r13440; | |
mov.u32 %r398, %r13441; | |
mov.u32 %r397, %r13442; | |
mov.u32 %r396, %r13443; | |
mov.u32 %r395, %r13444; | |
setp.le.u32 %p69, %r13189, %r426; | |
mov.u32 %r13221, %r426; | |
mov.u32 %r13222, %r425; | |
mov.u32 %r13223, %r424; | |
mov.u32 %r13224, %r423; | |
mov.u32 %r13225, %r422; | |
mov.u32 %r13226, %r421; | |
mov.u32 %r13227, %r420; | |
mov.u32 %r13228, %r419; | |
mov.u32 %r13229, %r418; | |
mov.u32 %r13230, %r417; | |
mov.u32 %r13231, %r416; | |
mov.u32 %r13232, %r415; | |
mov.u32 %r13233, %r414; | |
mov.u32 %r13234, %r413; | |
mov.u32 %r13235, %r412; | |
mov.u32 %r13236, %r411; | |
mov.u32 %r13237, %r410; | |
mov.u32 %r13238, %r409; | |
mov.u32 %r13239, %r408; | |
mov.u32 %r13240, %r407; | |
mov.u32 %r13241, %r406; | |
mov.u32 %r13242, %r405; | |
mov.u32 %r13243, %r404; | |
mov.u32 %r13244, %r403; | |
mov.u32 %r13245, %r402; | |
mov.u32 %r13246, %r401; | |
mov.u32 %r13247, %r400; | |
mov.u32 %r13248, %r399; | |
mov.u32 %r13249, %r398; | |
mov.u32 %r13250, %r397; | |
mov.u32 %r13251, %r396; | |
mov.u32 %r13252, %r395; | |
@%p69 bra BB12_134; | |
st.local.v4.u32 [%rd2], {%r426, %r425, %r424, %r423}; | |
st.local.v4.u32 [%rd2+128], {%r13189, %r13190, %r13191, %r13192}; | |
st.local.v4.u32 [%rd2+16], {%r422, %r421, %r420, %r419}; | |
st.local.v4.u32 [%rd2+144], {%r13193, %r13194, %r13195, %r13196}; | |
st.local.v4.u32 [%rd2+32], {%r418, %r417, %r416, %r415}; | |
st.local.v4.u32 [%rd2+160], {%r13197, %r13198, %r13199, %r13200}; | |
st.local.v4.u32 [%rd2+48], {%r414, %r413, %r412, %r411}; | |
st.local.v4.u32 [%rd2+176], {%r13201, %r13202, %r13203, %r13204}; | |
st.local.v4.u32 [%rd2+64], {%r410, %r409, %r408, %r407}; | |
st.local.v4.u32 [%rd2+192], {%r13205, %r13206, %r13207, %r13208}; | |
st.local.v4.u32 [%rd2+80], {%r406, %r405, %r404, %r403}; | |
st.local.v4.u32 [%rd2+208], {%r13209, %r13210, %r13211, %r13212}; | |
st.local.v4.u32 [%rd2+96], {%r402, %r401, %r400, %r399}; | |
st.local.v4.u32 [%rd2+224], {%r13213, %r13214, %r13215, %r13216}; | |
st.local.v4.u32 [%rd2+112], {%r398, %r397, %r396, %r395}; | |
st.local.v4.u32 [%rd2+240], {%r13217, %r13218, %r13219, %r13220}; | |
mov.u32 %r11686, %r13220; | |
mov.u32 %r11688, %r13219; | |
mov.u32 %r11690, %r13218; | |
mov.u32 %r11692, %r13217; | |
mov.u32 %r11694, %r13216; | |
mov.u32 %r11696, %r13215; | |
mov.u32 %r11698, %r13214; | |
mov.u32 %r11700, %r13213; | |
mov.u32 %r11702, %r13212; | |
mov.u32 %r11704, %r13211; | |
mov.u32 %r11706, %r13210; | |
mov.u32 %r11708, %r13209; | |
mov.u32 %r11710, %r13208; | |
mov.u32 %r11712, %r13207; | |
mov.u32 %r11714, %r13206; | |
mov.u32 %r11716, %r13205; | |
mov.u32 %r11718, %r13204; | |
mov.u32 %r11720, %r13203; | |
mov.u32 %r11722, %r13202; | |
mov.u32 %r11724, %r13201; | |
mov.u32 %r11726, %r13200; | |
mov.u32 %r11728, %r13199; | |
mov.u32 %r11730, %r13198; | |
mov.u32 %r11732, %r13197; | |
mov.u32 %r11734, %r13196; | |
mov.u32 %r11736, %r13195; | |
mov.u32 %r11738, %r13194; | |
mov.u32 %r11740, %r13193; | |
mov.u32 %r11742, %r13192; | |
mov.u32 %r11744, %r13191; | |
mov.u32 %r11746, %r13190; | |
mov.u32 %r11748, %r13189; | |
mov.u32 %r13220, %r395; | |
mov.u32 %r13219, %r396; | |
mov.u32 %r13218, %r397; | |
mov.u32 %r13217, %r398; | |
mov.u32 %r13216, %r399; | |
mov.u32 %r13215, %r400; | |
mov.u32 %r13214, %r401; | |
mov.u32 %r13213, %r402; | |
mov.u32 %r13212, %r403; | |
mov.u32 %r13211, %r404; | |
mov.u32 %r13210, %r405; | |
mov.u32 %r13209, %r406; | |
mov.u32 %r13208, %r407; | |
mov.u32 %r13207, %r408; | |
mov.u32 %r13206, %r409; | |
mov.u32 %r13205, %r410; | |
mov.u32 %r13204, %r411; | |
mov.u32 %r13203, %r412; | |
mov.u32 %r13202, %r413; | |
mov.u32 %r13201, %r414; | |
mov.u32 %r13200, %r415; | |
mov.u32 %r13199, %r416; | |
mov.u32 %r13198, %r417; | |
mov.u32 %r13197, %r418; | |
mov.u32 %r13196, %r419; | |
mov.u32 %r13195, %r420; | |
mov.u32 %r13194, %r421; | |
mov.u32 %r13193, %r422; | |
mov.u32 %r13192, %r423; | |
mov.u32 %r13191, %r424; | |
mov.u32 %r13190, %r425; | |
mov.u32 %r13189, %r426; | |
mov.u32 %r13221, %r11748; | |
mov.u32 %r13222, %r11746; | |
mov.u32 %r13223, %r11744; | |
mov.u32 %r13224, %r11742; | |
mov.u32 %r13225, %r11740; | |
mov.u32 %r13226, %r11738; | |
mov.u32 %r13227, %r11736; | |
mov.u32 %r13228, %r11734; | |
mov.u32 %r13229, %r11732; | |
mov.u32 %r13230, %r11730; | |
mov.u32 %r13231, %r11728; | |
mov.u32 %r13232, %r11726; | |
mov.u32 %r13233, %r11724; | |
mov.u32 %r13234, %r11722; | |
mov.u32 %r13235, %r11720; | |
mov.u32 %r13236, %r11718; | |
mov.u32 %r13237, %r11716; | |
mov.u32 %r13238, %r11714; | |
mov.u32 %r13239, %r11712; | |
mov.u32 %r13240, %r11710; | |
mov.u32 %r13241, %r11708; | |
mov.u32 %r13242, %r11706; | |
mov.u32 %r13243, %r11704; | |
mov.u32 %r13244, %r11702; | |
mov.u32 %r13245, %r11700; | |
mov.u32 %r13246, %r11698; | |
mov.u32 %r13247, %r11696; | |
mov.u32 %r13248, %r11694; | |
mov.u32 %r13249, %r11692; | |
mov.u32 %r13250, %r11690; | |
mov.u32 %r13251, %r11688; | |
mov.u32 %r13252, %r11686; | |
BB12_134: | |
mov.u32 %r13061, %r13189; | |
mov.u32 %r13062, %r13190; | |
mov.u32 %r13063, %r13191; | |
mov.u32 %r13064, %r13192; | |
mov.u32 %r13065, %r13193; | |
mov.u32 %r13066, %r13194; | |
mov.u32 %r13067, %r13195; | |
mov.u32 %r13068, %r13196; | |
mov.u32 %r13069, %r13197; | |
mov.u32 %r13070, %r13198; | |
mov.u32 %r13071, %r13199; | |
mov.u32 %r13072, %r13200; | |
mov.u32 %r13073, %r13201; | |
mov.u32 %r13074, %r13202; | |
mov.u32 %r13075, %r13203; | |
mov.u32 %r13076, %r13204; | |
mov.u32 %r13077, %r13205; | |
mov.u32 %r13078, %r13206; | |
mov.u32 %r13079, %r13207; | |
mov.u32 %r13080, %r13208; | |
mov.u32 %r13081, %r13209; | |
mov.u32 %r13082, %r13210; | |
mov.u32 %r13083, %r13211; | |
mov.u32 %r13084, %r13212; | |
mov.u32 %r13085, %r13213; | |
mov.u32 %r13086, %r13214; | |
mov.u32 %r13087, %r13215; | |
mov.u32 %r13088, %r13216; | |
mov.u32 %r13089, %r13217; | |
mov.u32 %r13090, %r13218; | |
mov.u32 %r13091, %r13219; | |
mov.u32 %r13092, %r13220; | |
mov.u32 %r13093, %r13221; | |
mov.u32 %r13094, %r13222; | |
mov.u32 %r13095, %r13223; | |
mov.u32 %r13096, %r13224; | |
mov.u32 %r13097, %r13225; | |
mov.u32 %r13098, %r13226; | |
mov.u32 %r13099, %r13227; | |
mov.u32 %r13100, %r13228; | |
mov.u32 %r13101, %r13229; | |
mov.u32 %r13102, %r13230; | |
mov.u32 %r13103, %r13231; | |
mov.u32 %r13104, %r13232; | |
mov.u32 %r13105, %r13233; | |
mov.u32 %r13106, %r13234; | |
mov.u32 %r13107, %r13235; | |
mov.u32 %r13108, %r13236; | |
mov.u32 %r13109, %r13237; | |
mov.u32 %r13110, %r13238; | |
mov.u32 %r13111, %r13239; | |
mov.u32 %r13112, %r13240; | |
mov.u32 %r13113, %r13241; | |
mov.u32 %r13114, %r13242; | |
mov.u32 %r13115, %r13243; | |
mov.u32 %r13116, %r13244; | |
mov.u32 %r13117, %r13245; | |
mov.u32 %r13118, %r13246; | |
mov.u32 %r13119, %r13247; | |
mov.u32 %r13120, %r13248; | |
mov.u32 %r13121, %r13249; | |
mov.u32 %r13122, %r13250; | |
mov.u32 %r13123, %r13251; | |
mov.u32 %r13124, %r13252; | |
mul.lo.s64 %rd901, %rd15, 1792; | |
add.s64 %rd902, %rd4, %rd901; | |
bfe.u32 %r5722, %r11, 22, 6; | |
mul.wide.u32 %rd903, %r5722, 28; | |
add.s64 %rd904, %rd902, %rd903; | |
ld.global.u32 %r491, [%rd904+-4]; | |
and.b32 %r5723, %r491, 65535; | |
mul.wide.u32 %rd905, %r5723, 1792; | |
add.s64 %rd906, %rd6, %rd905; | |
bfe.u32 %r5724, %r491, 16, 6; | |
mul.wide.u32 %rd907, %r5724, 28; | |
add.s64 %rd908, %rd906, %rd907; | |
ld.global.u32 %r492, [%rd908+-4]; | |
and.b32 %r5725, %r492, 65535; | |
mul.wide.u32 %rd909, %r5725, 1792; | |
add.s64 %rd910, %rd4, %rd909; | |
bfe.u32 %r5726, %r492, 16, 6; | |
mul.wide.u32 %rd911, %r5726, 28; | |
add.s64 %rd912, %rd910, %rd911; | |
ld.global.u32 %r493, [%rd912+-8]; | |
and.b32 %r5727, %r493, 65535; | |
mul.wide.u32 %rd913, %r5727, 1792; | |
add.s64 %rd914, %rd6, %rd913; | |
bfe.u32 %r5728, %r493, 16, 6; | |
mul.wide.u32 %rd915, %r5728, 28; | |
add.s64 %rd916, %rd914, %rd915; | |
ld.global.u32 %r494, [%rd916+-8]; | |
and.b32 %r5729, %r494, 65535; | |
mul.wide.u32 %rd917, %r5729, 1792; | |
add.s64 %rd918, %rd4, %rd917; | |
cvt.u64.u32 %rd48, %r5723; | |
cvt.u64.u32 %rd49, %r5725; | |
cvt.u64.u32 %rd50, %r5727; | |
cvt.u64.u32 %rd51, %r5729; | |
bfe.u32 %r5730, %r494, 16, 6; | |
mul.wide.u32 %rd919, %r5730, 28; | |
add.s64 %rd920, %rd918, %rd919; | |
ld.global.u32 %r495, [%rd920+-12]; | |
and.b32 %r5731, %r495, 65535; | |
cvt.u64.u32 %rd52, %r5731; | |
bfe.u32 %r5732, %r495, 16, 6; | |
mul.wide.u32 %rd921, %r5731, 1792; | |
add.s64 %rd922, %rd415, %rd921; | |
mul.wide.u32 %rd923, %r5732, 28; | |
add.s64 %rd924, %rd922, %rd923; | |
ld.global.u32 %r5733, [%rd924]; | |
and.b32 %r5734, %r5733, 65535; | |
bfe.u32 %r5735, %r5733, 16, 6; | |
mul.wide.u32 %rd925, %r5734, 1792; | |
add.s64 %rd926, %rd414, %rd925; | |
mul.wide.u32 %rd927, %r5735, 28; | |
add.s64 %rd928, %rd926, %rd927; | |
ld.global.u32 %r5736, [%rd928]; | |
and.b32 %r5737, %r5736, 65535; | |
shl.b32 %r5738, %r5737, 6; | |
bfe.u32 %r5739, %r5736, 16, 6; | |
or.b32 %r496, %r5738, %r5739; | |
st.local.u32 [%rd2+256], %r496; | |
bfe.u32 %r5740, %r5733, 22, 6; | |
mul.wide.u32 %rd929, %r5740, 28; | |
add.s64 %rd930, %rd926, %rd929; | |
ld.global.u32 %r5741, [%rd930]; | |
and.b32 %r5742, %r5741, 65535; | |
shl.b32 %r5743, %r5742, 6; | |
bfe.u32 %r5744, %r5741, 16, 6; | |
or.b32 %r13698, %r5743, %r5744; | |
st.local.u32 [%rd2+260], %r13698; | |
setp.le.u32 %p70, %r496, %r13698; | |
mov.u32 %r13697, %r496; | |
@%p70 bra BB12_136; | |
st.local.v2.u32 [%rd2+256], {%r13698, %r496}; | |
mov.u32 %r12229, %r13698; | |
mov.u32 %r13698, %r496; | |
mov.u32 %r13697, %r12229; | |
BB12_136: | |
mov.u32 %r13693, %r13697; | |
mov.u32 %r13694, %r13698; | |
bfe.u32 %r5745, %r495, 22, 6; | |
mul.lo.s64 %rd931, %rd52, 1792; | |
add.s64 %rd932, %rd415, %rd931; | |
mul.wide.u32 %rd933, %r5745, 28; | |
add.s64 %rd934, %rd932, %rd933; | |
ld.global.u32 %r5746, [%rd934]; | |
and.b32 %r5747, %r5746, 65535; | |
bfe.u32 %r5748, %r5746, 16, 6; | |
mul.wide.u32 %rd935, %r5747, 1792; | |
add.s64 %rd936, %rd414, %rd935; | |
mul.wide.u32 %rd937, %r5748, 28; | |
add.s64 %rd938, %rd936, %rd937; | |
ld.global.u32 %r5749, [%rd938]; | |
and.b32 %r5750, %r5749, 65535; | |
shl.b32 %r5751, %r5750, 6; | |
bfe.u32 %r5752, %r5749, 16, 6; | |
or.b32 %r500, %r5751, %r5752; | |
st.local.u32 [%rd2+264], %r500; | |
bfe.u32 %r5753, %r5746, 22, 6; | |
mul.wide.u32 %rd939, %r5753, 28; | |
add.s64 %rd940, %rd936, %rd939; | |
ld.global.u32 %r5754, [%rd940]; | |
and.b32 %r5755, %r5754, 65535; | |
shl.b32 %r5756, %r5755, 6; | |
bfe.u32 %r5757, %r5754, 16, 6; | |
or.b32 %r13700, %r5756, %r5757; | |
st.local.u32 [%rd2+268], %r13700; | |
setp.le.u32 %p71, %r500, %r13700; | |
mov.u32 %r13699, %r500; | |
@%p71 bra BB12_138; | |
st.local.v2.u32 [%rd2+264], {%r13700, %r500}; | |
mov.u32 %r12235, %r13700; | |
mov.u32 %r13700, %r500; | |
mov.u32 %r13699, %r12235; | |
BB12_138: | |
mov.u32 %r503, %r13699; | |
mov.u32 %r502, %r13700; | |
setp.le.u32 %p72, %r13693, %r503; | |
mov.u32 %r13695, %r503; | |
mov.u32 %r13696, %r502; | |
@%p72 bra BB12_140; | |
st.local.v4.u32 [%rd2+256], {%r503, %r502, %r13693, %r13694}; | |
mov.u32 %r12232, %r13694; | |
mov.u32 %r12234, %r13693; | |
mov.u32 %r13694, %r502; | |
mov.u32 %r13693, %r503; | |
mov.u32 %r13695, %r12234; | |
mov.u32 %r13696, %r12232; | |
BB12_140: | |
mov.u32 %r13685, %r13693; | |
mov.u32 %r13686, %r13694; | |
mov.u32 %r13687, %r13695; | |
mov.u32 %r13688, %r13696; | |
mul.lo.s64 %rd941, %rd51, 1792; | |
add.s64 %rd942, %rd4, %rd941; | |
bfe.u32 %r5758, %r494, 22, 6; | |
mul.wide.u32 %rd943, %r5758, 28; | |
add.s64 %rd944, %rd942, %rd943; | |
ld.global.u32 %r508, [%rd944+-12]; | |
and.b32 %r5759, %r508, 65535; | |
cvt.u64.u32 %rd53, %r5759; | |
bfe.u32 %r5760, %r508, 16, 6; | |
mul.wide.u32 %rd945, %r5759, 1792; | |
add.s64 %rd946, %rd415, %rd945; | |
mul.wide.u32 %rd947, %r5760, 28; | |
add.s64 %rd948, %rd946, %rd947; | |
ld.global.u32 %r5761, [%rd948]; | |
and.b32 %r5762, %r5761, 65535; | |
bfe.u32 %r5763, %r5761, 16, 6; | |
mul.wide.u32 %rd949, %r5762, 1792; | |
add.s64 %rd950, %rd414, %rd949; | |
mul.wide.u32 %rd951, %r5763, 28; | |
add.s64 %rd952, %rd950, %rd951; | |
ld.global.u32 %r5764, [%rd952]; | |
and.b32 %r5765, %r5764, 65535; | |
shl.b32 %r5766, %r5765, 6; | |
bfe.u32 %r5767, %r5764, 16, 6; | |
or.b32 %r509, %r5766, %r5767; | |
st.local.u32 [%rd2+272], %r509; | |
bfe.u32 %r5768, %r5761, 22, 6; | |
mul.wide.u32 %rd953, %r5768, 28; | |
add.s64 %rd954, %rd950, %rd953; | |
ld.global.u32 %r5769, [%rd954]; | |
and.b32 %r5770, %r5769, 65535; | |
shl.b32 %r5771, %r5770, 6; | |
bfe.u32 %r5772, %r5769, 16, 6; | |
or.b32 %r13706, %r5771, %r5772; | |
st.local.u32 [%rd2+276], %r13706; | |
setp.le.u32 %p73, %r509, %r13706; | |
mov.u32 %r13705, %r509; | |
@%p73 bra BB12_142; | |
st.local.v2.u32 [%rd2+272], {%r13706, %r509}; | |
mov.u32 %r12249, %r13706; | |
mov.u32 %r13706, %r509; | |
mov.u32 %r13705, %r12249; | |
BB12_142: | |
mov.u32 %r13701, %r13705; | |
mov.u32 %r13702, %r13706; | |
bfe.u32 %r5773, %r508, 22, 6; | |
mul.lo.s64 %rd955, %rd53, 1792; | |
add.s64 %rd956, %rd415, %rd955; | |
mul.wide.u32 %rd957, %r5773, 28; | |
add.s64 %rd958, %rd956, %rd957; | |
ld.global.u32 %r5774, [%rd958]; | |
and.b32 %r5775, %r5774, 65535; | |
bfe.u32 %r5776, %r5774, 16, 6; | |
mul.wide.u32 %rd959, %r5775, 1792; | |
add.s64 %rd960, %rd414, %rd959; | |
mul.wide.u32 %rd961, %r5776, 28; | |
add.s64 %rd962, %rd960, %rd961; | |
ld.global.u32 %r5777, [%rd962]; | |
and.b32 %r5778, %r5777, 65535; | |
shl.b32 %r5779, %r5778, 6; | |
bfe.u32 %r5780, %r5777, 16, 6; | |
or.b32 %r513, %r5779, %r5780; | |
st.local.u32 [%rd2+280], %r513; | |
bfe.u32 %r5781, %r5774, 22, 6; | |
mul.wide.u32 %rd963, %r5781, 28; | |
add.s64 %rd964, %rd960, %rd963; | |
ld.global.u32 %r5782, [%rd964]; | |
and.b32 %r5783, %r5782, 65535; | |
shl.b32 %r5784, %r5783, 6; | |
bfe.u32 %r5785, %r5782, 16, 6; | |
or.b32 %r13708, %r5784, %r5785; | |
st.local.u32 [%rd2+284], %r13708; | |
setp.le.u32 %p74, %r513, %r13708; | |
mov.u32 %r13707, %r513; | |
@%p74 bra BB12_144; | |
st.local.v2.u32 [%rd2+280], {%r13708, %r513}; | |
mov.u32 %r12255, %r13708; | |
mov.u32 %r13708, %r513; | |
mov.u32 %r13707, %r12255; | |
BB12_144: | |
mov.u32 %r516, %r13707; | |
mov.u32 %r515, %r13708; | |
setp.le.u32 %p75, %r13701, %r516; | |
mov.u32 %r13703, %r516; | |
mov.u32 %r13704, %r515; | |
@%p75 bra BB12_146; | |
st.local.v4.u32 [%rd2+272], {%r516, %r515, %r13701, %r13702}; | |
mov.u32 %r12252, %r13702; | |
mov.u32 %r12254, %r13701; | |
mov.u32 %r13702, %r515; | |
mov.u32 %r13701, %r516; | |
mov.u32 %r13703, %r12254; | |
mov.u32 %r13704, %r12252; | |
BB12_146: | |
mov.u32 %r520, %r13701; | |
mov.u32 %r519, %r13702; | |
mov.u32 %r518, %r13703; | |
mov.u32 %r517, %r13704; | |
setp.le.u32 %p76, %r13685, %r520; | |
mov.u32 %r13689, %r520; | |
mov.u32 %r13690, %r519; | |
mov.u32 %r13691, %r518; | |
mov.u32 %r13692, %r517; | |
@%p76 bra BB12_148; | |
st.local.v4.u32 [%rd2+256], {%r520, %r519, %r518, %r517}; | |
st.local.v4.u32 [%rd2+272], {%r13685, %r13686, %r13687, %r13688}; | |
mov.u32 %r12242, %r13688; | |
mov.u32 %r12244, %r13687; | |
mov.u32 %r12246, %r13686; | |
mov.u32 %r12248, %r13685; | |
mov.u32 %r13688, %r517; | |
mov.u32 %r13687, %r518; | |
mov.u32 %r13686, %r519; | |
mov.u32 %r13685, %r520; | |
mov.u32 %r13689, %r12248; | |
mov.u32 %r13690, %r12246; | |
mov.u32 %r13691, %r12244; | |
mov.u32 %r13692, %r12242; | |
BB12_148: | |
mov.u32 %r13669, %r13685; | |
mov.u32 %r13670, %r13686; | |
mov.u32 %r13671, %r13687; | |
mov.u32 %r13672, %r13688; | |
mov.u32 %r13673, %r13689; | |
mov.u32 %r13674, %r13690; | |
mov.u32 %r13675, %r13691; | |
mov.u32 %r13676, %r13692; | |
mul.lo.s64 %rd965, %rd50, 1792; | |
add.s64 %rd966, %rd6, %rd965; | |
bfe.u32 %r5786, %r493, 22, 6; | |
mul.wide.u32 %rd967, %r5786, 28; | |
add.s64 %rd968, %rd966, %rd967; | |
ld.global.u32 %r529, [%rd968+-8]; | |
and.b32 %r5787, %r529, 65535; | |
mul.wide.u32 %rd969, %r5787, 1792; | |
add.s64 %rd970, %rd4, %rd969; | |
cvt.u64.u32 %rd54, %r5787; | |
bfe.u32 %r5788, %r529, 16, 6; | |
mul.wide.u32 %rd971, %r5788, 28; | |
add.s64 %rd972, %rd970, %rd971; | |
ld.global.u32 %r530, [%rd972+-12]; | |
and.b32 %r5789, %r530, 65535; | |
cvt.u64.u32 %rd55, %r5789; | |
bfe.u32 %r5790, %r530, 16, 6; | |
mul.wide.u32 %rd973, %r5789, 1792; | |
add.s64 %rd974, %rd415, %rd973; | |
mul.wide.u32 %rd975, %r5790, 28; | |
add.s64 %rd976, %rd974, %rd975; | |
ld.global.u32 %r5791, [%rd976]; | |
and.b32 %r5792, %r5791, 65535; | |
bfe.u32 %r5793, %r5791, 16, 6; | |
mul.wide.u32 %rd977, %r5792, 1792; | |
add.s64 %rd978, %rd414, %rd977; | |
mul.wide.u32 %rd979, %r5793, 28; | |
add.s64 %rd980, %rd978, %rd979; | |
ld.global.u32 %r5794, [%rd980]; | |
and.b32 %r5795, %r5794, 65535; | |
shl.b32 %r5796, %r5795, 6; | |
bfe.u32 %r5797, %r5794, 16, 6; | |
or.b32 %r531, %r5796, %r5797; | |
st.local.u32 [%rd2+288], %r531; | |
bfe.u32 %r5798, %r5791, 22, 6; | |
mul.wide.u32 %rd981, %r5798, 28; | |
add.s64 %rd982, %rd978, %rd981; | |
ld.global.u32 %r5799, [%rd982]; | |
and.b32 %r5800, %r5799, 65535; | |
shl.b32 %r5801, %r5800, 6; | |
bfe.u32 %r5802, %r5799, 16, 6; | |
or.b32 %r13722, %r5801, %r5802; | |
st.local.u32 [%rd2+292], %r13722; | |
setp.le.u32 %p77, %r531, %r13722; | |
mov.u32 %r13721, %r531; | |
@%p77 bra BB12_150; | |
st.local.v2.u32 [%rd2+288], {%r13722, %r531}; | |
mov.u32 %r12285, %r13722; | |
mov.u32 %r13722, %r531; | |
mov.u32 %r13721, %r12285; | |
BB12_150: | |
mov.u32 %r13717, %r13721; | |
mov.u32 %r13718, %r13722; | |
bfe.u32 %r5803, %r530, 22, 6; | |
mul.lo.s64 %rd983, %rd55, 1792; | |
add.s64 %rd984, %rd415, %rd983; | |
mul.wide.u32 %rd985, %r5803, 28; | |
add.s64 %rd986, %rd984, %rd985; | |
ld.global.u32 %r5804, [%rd986]; | |
and.b32 %r5805, %r5804, 65535; | |
bfe.u32 %r5806, %r5804, 16, 6; | |
mul.wide.u32 %rd987, %r5805, 1792; | |
add.s64 %rd988, %rd414, %rd987; | |
mul.wide.u32 %rd989, %r5806, 28; | |
add.s64 %rd990, %rd988, %rd989; | |
ld.global.u32 %r5807, [%rd990]; | |
and.b32 %r5808, %r5807, 65535; | |
shl.b32 %r5809, %r5808, 6; | |
bfe.u32 %r5810, %r5807, 16, 6; | |
or.b32 %r535, %r5809, %r5810; | |
st.local.u32 [%rd2+296], %r535; | |
bfe.u32 %r5811, %r5804, 22, 6; | |
mul.wide.u32 %rd991, %r5811, 28; | |
add.s64 %rd992, %rd988, %rd991; | |
ld.global.u32 %r5812, [%rd992]; | |
and.b32 %r5813, %r5812, 65535; | |
shl.b32 %r5814, %r5813, 6; | |
bfe.u32 %r5815, %r5812, 16, 6; | |
or.b32 %r13724, %r5814, %r5815; | |
st.local.u32 [%rd2+300], %r13724; | |
setp.le.u32 %p78, %r535, %r13724; | |
mov.u32 %r13723, %r535; | |
@%p78 bra BB12_152; | |
st.local.v2.u32 [%rd2+296], {%r13724, %r535}; | |
mov.u32 %r12291, %r13724; | |
mov.u32 %r13724, %r535; | |
mov.u32 %r13723, %r12291; | |
BB12_152: | |
mov.u32 %r538, %r13723; | |
mov.u32 %r537, %r13724; | |
setp.le.u32 %p79, %r13717, %r538; | |
mov.u32 %r13719, %r538; | |
mov.u32 %r13720, %r537; | |
@%p79 bra BB12_154; | |
st.local.v4.u32 [%rd2+288], {%r538, %r537, %r13717, %r13718}; | |
mov.u32 %r12288, %r13718; | |
mov.u32 %r12290, %r13717; | |
mov.u32 %r13718, %r537; | |
mov.u32 %r13717, %r538; | |
mov.u32 %r13719, %r12290; | |
mov.u32 %r13720, %r12288; | |
BB12_154: | |
mov.u32 %r13709, %r13717; | |
mov.u32 %r13710, %r13718; | |
mov.u32 %r13711, %r13719; | |
mov.u32 %r13712, %r13720; | |
mul.lo.s64 %rd993, %rd54, 1792; | |
add.s64 %rd994, %rd4, %rd993; | |
bfe.u32 %r5816, %r529, 22, 6; | |
mul.wide.u32 %rd995, %r5816, 28; | |
add.s64 %rd996, %rd994, %rd995; | |
ld.global.u32 %r543, [%rd996+-12]; | |
and.b32 %r5817, %r543, 65535; | |
cvt.u64.u32 %rd56, %r5817; | |
bfe.u32 %r5818, %r543, 16, 6; | |
mul.wide.u32 %rd997, %r5817, 1792; | |
add.s64 %rd998, %rd415, %rd997; | |
mul.wide.u32 %rd999, %r5818, 28; | |
add.s64 %rd1000, %rd998, %rd999; | |
ld.global.u32 %r5819, [%rd1000]; | |
and.b32 %r5820, %r5819, 65535; | |
bfe.u32 %r5821, %r5819, 16, 6; | |
mul.wide.u32 %rd1001, %r5820, 1792; | |
add.s64 %rd1002, %rd414, %rd1001; | |
mul.wide.u32 %rd1003, %r5821, 28; | |
add.s64 %rd1004, %rd1002, %rd1003; | |
ld.global.u32 %r5822, [%rd1004]; | |
and.b32 %r5823, %r5822, 65535; | |
shl.b32 %r5824, %r5823, 6; | |
bfe.u32 %r5825, %r5822, 16, 6; | |
or.b32 %r544, %r5824, %r5825; | |
st.local.u32 [%rd2+304], %r544; | |
bfe.u32 %r5826, %r5819, 22, 6; | |
mul.wide.u32 %rd1005, %r5826, 28; | |
add.s64 %rd1006, %rd1002, %rd1005; | |
ld.global.u32 %r5827, [%rd1006]; | |
and.b32 %r5828, %r5827, 65535; | |
shl.b32 %r5829, %r5828, 6; | |
bfe.u32 %r5830, %r5827, 16, 6; | |
or.b32 %r13730, %r5829, %r5830; | |
st.local.u32 [%rd2+308], %r13730; | |
setp.le.u32 %p80, %r544, %r13730; | |
mov.u32 %r13729, %r544; | |
@%p80 bra BB12_156; | |
st.local.v2.u32 [%rd2+304], {%r13730, %r544}; | |
mov.u32 %r12305, %r13730; | |
mov.u32 %r13730, %r544; | |
mov.u32 %r13729, %r12305; | |
BB12_156: | |
mov.u32 %r13725, %r13729; | |
mov.u32 %r13726, %r13730; | |
bfe.u32 %r5831, %r543, 22, 6; | |
mul.lo.s64 %rd1007, %rd56, 1792; | |
add.s64 %rd1008, %rd415, %rd1007; | |
mul.wide.u32 %rd1009, %r5831, 28; | |
add.s64 %rd1010, %rd1008, %rd1009; | |
ld.global.u32 %r5832, [%rd1010]; | |
and.b32 %r5833, %r5832, 65535; | |
bfe.u32 %r5834, %r5832, 16, 6; | |
mul.wide.u32 %rd1011, %r5833, 1792; | |
add.s64 %rd1012, %rd414, %rd1011; | |
mul.wide.u32 %rd1013, %r5834, 28; | |
add.s64 %rd1014, %rd1012, %rd1013; | |
ld.global.u32 %r5835, [%rd1014]; | |
and.b32 %r5836, %r5835, 65535; | |
shl.b32 %r5837, %r5836, 6; | |
bfe.u32 %r5838, %r5835, 16, 6; | |
or.b32 %r548, %r5837, %r5838; | |
st.local.u32 [%rd2+312], %r548; | |
bfe.u32 %r5839, %r5832, 22, 6; | |
mul.wide.u32 %rd1015, %r5839, 28; | |
add.s64 %rd1016, %rd1012, %rd1015; | |
ld.global.u32 %r5840, [%rd1016]; | |
and.b32 %r5841, %r5840, 65535; | |
shl.b32 %r5842, %r5841, 6; | |
bfe.u32 %r5843, %r5840, 16, 6; | |
or.b32 %r13732, %r5842, %r5843; | |
st.local.u32 [%rd2+316], %r13732; | |
setp.le.u32 %p81, %r548, %r13732; | |
mov.u32 %r13731, %r548; | |
@%p81 bra BB12_158; | |
st.local.v2.u32 [%rd2+312], {%r13732, %r548}; | |
mov.u32 %r12311, %r13732; | |
mov.u32 %r13732, %r548; | |
mov.u32 %r13731, %r12311; | |
BB12_158: | |
mov.u32 %r551, %r13731; | |
mov.u32 %r550, %r13732; | |
setp.le.u32 %p82, %r13725, %r551; | |
mov.u32 %r13727, %r551; | |
mov.u32 %r13728, %r550; | |
@%p82 bra BB12_160; | |
st.local.v4.u32 [%rd2+304], {%r551, %r550, %r13725, %r13726}; | |
mov.u32 %r12308, %r13726; | |
mov.u32 %r12310, %r13725; | |
mov.u32 %r13726, %r550; | |
mov.u32 %r13725, %r551; | |
mov.u32 %r13727, %r12310; | |
mov.u32 %r13728, %r12308; | |
BB12_160: | |
mov.u32 %r555, %r13725; | |
mov.u32 %r554, %r13726; | |
mov.u32 %r553, %r13727; | |
mov.u32 %r552, %r13728; | |
setp.le.u32 %p83, %r13709, %r555; | |
mov.u32 %r13713, %r555; | |
mov.u32 %r13714, %r554; | |
mov.u32 %r13715, %r553; | |
mov.u32 %r13716, %r552; | |
@%p83 bra BB12_162; | |
st.local.v4.u32 [%rd2+288], {%r555, %r554, %r553, %r552}; | |
st.local.v4.u32 [%rd2+304], {%r13709, %r13710, %r13711, %r13712}; | |
mov.u32 %r12298, %r13712; | |
mov.u32 %r12300, %r13711; | |
mov.u32 %r12302, %r13710; | |
mov.u32 %r12304, %r13709; | |
mov.u32 %r13712, %r552; | |
mov.u32 %r13711, %r553; | |
mov.u32 %r13710, %r554; | |
mov.u32 %r13709, %r555; | |
mov.u32 %r13713, %r12304; | |
mov.u32 %r13714, %r12302; | |
mov.u32 %r13715, %r12300; | |
mov.u32 %r13716, %r12298; | |
BB12_162: | |
mov.u32 %r563, %r13709; | |
mov.u32 %r562, %r13710; | |
mov.u32 %r561, %r13711; | |
mov.u32 %r560, %r13712; | |
mov.u32 %r559, %r13713; | |
mov.u32 %r558, %r13714; | |
mov.u32 %r557, %r13715; | |
mov.u32 %r556, %r13716; | |
setp.le.u32 %p84, %r13669, %r563; | |
mov.u32 %r13677, %r563; | |
mov.u32 %r13678, %r562; | |
mov.u32 %r13679, %r561; | |
mov.u32 %r13680, %r560; | |
mov.u32 %r13681, %r559; | |
mov.u32 %r13682, %r558; | |
mov.u32 %r13683, %r557; | |
mov.u32 %r13684, %r556; | |
@%p84 bra BB12_164; | |
st.local.v4.u32 [%rd2+256], {%r563, %r562, %r561, %r560}; | |
st.local.v4.u32 [%rd2+288], {%r13669, %r13670, %r13671, %r13672}; | |
st.local.v4.u32 [%rd2+272], {%r559, %r558, %r557, %r556}; | |
st.local.v4.u32 [%rd2+304], {%r13673, %r13674, %r13675, %r13676}; | |
mov.u32 %r12270, %r13676; | |
mov.u32 %r12272, %r13675; | |
mov.u32 %r12274, %r13674; | |
mov.u32 %r12276, %r13673; | |
mov.u32 %r12278, %r13672; | |
mov.u32 %r12280, %r13671; | |
mov.u32 %r12282, %r13670; | |
mov.u32 %r12284, %r13669; | |
mov.u32 %r13676, %r556; | |
mov.u32 %r13675, %r557; | |
mov.u32 %r13674, %r558; | |
mov.u32 %r13673, %r559; | |
mov.u32 %r13672, %r560; | |
mov.u32 %r13671, %r561; | |
mov.u32 %r13670, %r562; | |
mov.u32 %r13669, %r563; | |
mov.u32 %r13677, %r12284; | |
mov.u32 %r13678, %r12282; | |
mov.u32 %r13679, %r12280; | |
mov.u32 %r13680, %r12278; | |
mov.u32 %r13681, %r12276; | |
mov.u32 %r13682, %r12274; | |
mov.u32 %r13683, %r12272; | |
mov.u32 %r13684, %r12270; | |
BB12_164: | |
mov.u32 %r13637, %r13669; | |
mov.u32 %r13638, %r13670; | |
mov.u32 %r13639, %r13671; | |
mov.u32 %r13640, %r13672; | |
mov.u32 %r13641, %r13673; | |
mov.u32 %r13642, %r13674; | |
mov.u32 %r13643, %r13675; | |
mov.u32 %r13644, %r13676; | |
mov.u32 %r13645, %r13677; | |
mov.u32 %r13646, %r13678; | |
mov.u32 %r13647, %r13679; | |
mov.u32 %r13648, %r13680; | |
mov.u32 %r13649, %r13681; | |
mov.u32 %r13650, %r13682; | |
mov.u32 %r13651, %r13683; | |
mov.u32 %r13652, %r13684; | |
mul.lo.s64 %rd1017, %rd49, 1792; | |
add.s64 %rd1018, %rd4, %rd1017; | |
bfe.u32 %r5844, %r492, 22, 6; | |
mul.wide.u32 %rd1019, %r5844, 28; | |
add.s64 %rd1020, %rd1018, %rd1019; | |
ld.global.u32 %r580, [%rd1020+-8]; | |
and.b32 %r5845, %r580, 65535; | |
mul.wide.u32 %rd1021, %r5845, 1792; | |
add.s64 %rd1022, %rd6, %rd1021; | |
bfe.u32 %r5846, %r580, 16, 6; | |
mul.wide.u32 %rd1023, %r5846, 28; | |
add.s64 %rd1024, %rd1022, %rd1023; | |
ld.global.u32 %r581, [%rd1024+-8]; | |
and.b32 %r5847, %r581, 65535; | |
mul.wide.u32 %rd1025, %r5847, 1792; | |
add.s64 %rd1026, %rd4, %rd1025; | |
cvt.u64.u32 %rd57, %r5845; | |
cvt.u64.u32 %rd58, %r5847; | |
bfe.u32 %r5848, %r581, 16, 6; | |
mul.wide.u32 %rd1027, %r5848, 28; | |
add.s64 %rd1028, %rd1026, %rd1027; | |
ld.global.u32 %r582, [%rd1028+-12]; | |
and.b32 %r5849, %r582, 65535; | |
cvt.u64.u32 %rd59, %r5849; | |
bfe.u32 %r5850, %r582, 16, 6; | |
mul.wide.u32 %rd1029, %r5849, 1792; | |
add.s64 %rd1030, %rd415, %rd1029; | |
mul.wide.u32 %rd1031, %r5850, 28; | |
add.s64 %rd1032, %rd1030, %rd1031; | |
ld.global.u32 %r5851, [%rd1032]; | |
and.b32 %r5852, %r5851, 65535; | |
bfe.u32 %r5853, %r5851, 16, 6; | |
mul.wide.u32 %rd1033, %r5852, 1792; | |
add.s64 %rd1034, %rd414, %rd1033; | |
mul.wide.u32 %rd1035, %r5853, 28; | |
add.s64 %rd1036, %rd1034, %rd1035; | |
ld.global.u32 %r5854, [%rd1036]; | |
and.b32 %r5855, %r5854, 65535; | |
shl.b32 %r5856, %r5855, 6; | |
bfe.u32 %r5857, %r5854, 16, 6; | |
or.b32 %r583, %r5856, %r5857; | |
st.local.u32 [%rd2+320], %r583; | |
bfe.u32 %r5858, %r5851, 22, 6; | |
mul.wide.u32 %rd1037, %r5858, 28; | |
add.s64 %rd1038, %rd1034, %rd1037; | |
ld.global.u32 %r5859, [%rd1038]; | |
and.b32 %r5860, %r5859, 65535; | |
shl.b32 %r5861, %r5860, 6; | |
bfe.u32 %r5862, %r5859, 16, 6; | |
or.b32 %r13762, %r5861, %r5862; | |
st.local.u32 [%rd2+324], %r13762; | |
setp.le.u32 %p85, %r583, %r13762; | |
mov.u32 %r13761, %r583; | |
@%p85 bra BB12_166; | |
st.local.v2.u32 [%rd2+320], {%r13762, %r583}; | |
mov.u32 %r12373, %r13762; | |
mov.u32 %r13762, %r583; | |
mov.u32 %r13761, %r12373; | |
BB12_166: | |
mov.u32 %r13757, %r13761; | |
mov.u32 %r13758, %r13762; | |
bfe.u32 %r5863, %r582, 22, 6; | |
mul.lo.s64 %rd1039, %rd59, 1792; | |
add.s64 %rd1040, %rd415, %rd1039; | |
mul.wide.u32 %rd1041, %r5863, 28; | |
add.s64 %rd1042, %rd1040, %rd1041; | |
ld.global.u32 %r5864, [%rd1042]; | |
and.b32 %r5865, %r5864, 65535; | |
bfe.u32 %r5866, %r5864, 16, 6; | |
mul.wide.u32 %rd1043, %r5865, 1792; | |
add.s64 %rd1044, %rd414, %rd1043; | |
mul.wide.u32 %rd1045, %r5866, 28; | |
add.s64 %rd1046, %rd1044, %rd1045; | |
ld.global.u32 %r5867, [%rd1046]; | |
and.b32 %r5868, %r5867, 65535; | |
shl.b32 %r5869, %r5868, 6; | |
bfe.u32 %r5870, %r5867, 16, 6; | |
or.b32 %r587, %r5869, %r5870; | |
st.local.u32 [%rd2+328], %r587; | |
bfe.u32 %r5871, %r5864, 22, 6; | |
mul.wide.u32 %rd1047, %r5871, 28; | |
add.s64 %rd1048, %rd1044, %rd1047; | |
ld.global.u32 %r5872, [%rd1048]; | |
and.b32 %r5873, %r5872, 65535; | |
shl.b32 %r5874, %r5873, 6; | |
bfe.u32 %r5875, %r5872, 16, 6; | |
or.b32 %r13764, %r5874, %r5875; | |
st.local.u32 [%rd2+332], %r13764; | |
setp.le.u32 %p86, %r587, %r13764; | |
mov.u32 %r13763, %r587; | |
@%p86 bra BB12_168; | |
st.local.v2.u32 [%rd2+328], {%r13764, %r587}; | |
mov.u32 %r12379, %r13764; | |
mov.u32 %r13764, %r587; | |
mov.u32 %r13763, %r12379; | |
BB12_168: | |
mov.u32 %r590, %r13763; | |
mov.u32 %r589, %r13764; | |
setp.le.u32 %p87, %r13757, %r590; | |
mov.u32 %r13759, %r590; | |
mov.u32 %r13760, %r589; | |
@%p87 bra BB12_170; | |
st.local.v4.u32 [%rd2+320], {%r590, %r589, %r13757, %r13758}; | |
mov.u32 %r12376, %r13758; | |
mov.u32 %r12378, %r13757; | |
mov.u32 %r13758, %r589; | |
mov.u32 %r13757, %r590; | |
mov.u32 %r13759, %r12378; | |
mov.u32 %r13760, %r12376; | |
BB12_170: | |
mov.u32 %r13749, %r13757; | |
mov.u32 %r13750, %r13758; | |
mov.u32 %r13751, %r13759; | |
mov.u32 %r13752, %r13760; | |
mul.lo.s64 %rd1049, %rd58, 1792; | |
add.s64 %rd1050, %rd4, %rd1049; | |
bfe.u32 %r5876, %r581, 22, 6; | |
mul.wide.u32 %rd1051, %r5876, 28; | |
add.s64 %rd1052, %rd1050, %rd1051; | |
ld.global.u32 %r595, [%rd1052+-12]; | |
and.b32 %r5877, %r595, 65535; | |
cvt.u64.u32 %rd60, %r5877; | |
bfe.u32 %r5878, %r595, 16, 6; | |
mul.wide.u32 %rd1053, %r5877, 1792; | |
add.s64 %rd1054, %rd415, %rd1053; | |
mul.wide.u32 %rd1055, %r5878, 28; | |
add.s64 %rd1056, %rd1054, %rd1055; | |
ld.global.u32 %r5879, [%rd1056]; | |
and.b32 %r5880, %r5879, 65535; | |
bfe.u32 %r5881, %r5879, 16, 6; | |
mul.wide.u32 %rd1057, %r5880, 1792; | |
add.s64 %rd1058, %rd414, %rd1057; | |
mul.wide.u32 %rd1059, %r5881, 28; | |
add.s64 %rd1060, %rd1058, %rd1059; | |
ld.global.u32 %r5882, [%rd1060]; | |
and.b32 %r5883, %r5882, 65535; | |
shl.b32 %r5884, %r5883, 6; | |
bfe.u32 %r5885, %r5882, 16, 6; | |
or.b32 %r596, %r5884, %r5885; | |
st.local.u32 [%rd2+336], %r596; | |
bfe.u32 %r5886, %r5879, 22, 6; | |
mul.wide.u32 %rd1061, %r5886, 28; | |
add.s64 %rd1062, %rd1058, %rd1061; | |
ld.global.u32 %r5887, [%rd1062]; | |
and.b32 %r5888, %r5887, 65535; | |
shl.b32 %r5889, %r5888, 6; | |
bfe.u32 %r5890, %r5887, 16, 6; | |
or.b32 %r13770, %r5889, %r5890; | |
st.local.u32 [%rd2+340], %r13770; | |
setp.le.u32 %p88, %r596, %r13770; | |
mov.u32 %r13769, %r596; | |
@%p88 bra BB12_172; | |
st.local.v2.u32 [%rd2+336], {%r13770, %r596}; | |
mov.u32 %r12393, %r13770; | |
mov.u32 %r13770, %r596; | |
mov.u32 %r13769, %r12393; | |
BB12_172: | |
mov.u32 %r13765, %r13769; | |
mov.u32 %r13766, %r13770; | |
bfe.u32 %r5891, %r595, 22, 6; | |
mul.lo.s64 %rd1063, %rd60, 1792; | |
add.s64 %rd1064, %rd415, %rd1063; | |
mul.wide.u32 %rd1065, %r5891, 28; | |
add.s64 %rd1066, %rd1064, %rd1065; | |
ld.global.u32 %r5892, [%rd1066]; | |
and.b32 %r5893, %r5892, 65535; | |
bfe.u32 %r5894, %r5892, 16, 6; | |
mul.wide.u32 %rd1067, %r5893, 1792; | |
add.s64 %rd1068, %rd414, %rd1067; | |
mul.wide.u32 %rd1069, %r5894, 28; | |
add.s64 %rd1070, %rd1068, %rd1069; | |
ld.global.u32 %r5895, [%rd1070]; | |
and.b32 %r5896, %r5895, 65535; | |
shl.b32 %r5897, %r5896, 6; | |
bfe.u32 %r5898, %r5895, 16, 6; | |
or.b32 %r600, %r5897, %r5898; | |
st.local.u32 [%rd2+344], %r600; | |
bfe.u32 %r5899, %r5892, 22, 6; | |
mul.wide.u32 %rd1071, %r5899, 28; | |
add.s64 %rd1072, %rd1068, %rd1071; | |
ld.global.u32 %r5900, [%rd1072]; | |
and.b32 %r5901, %r5900, 65535; | |
shl.b32 %r5902, %r5901, 6; | |
bfe.u32 %r5903, %r5900, 16, 6; | |
or.b32 %r13772, %r5902, %r5903; | |
st.local.u32 [%rd2+348], %r13772; | |
setp.le.u32 %p89, %r600, %r13772; | |
mov.u32 %r13771, %r600; | |
@%p89 bra BB12_174; | |
st.local.v2.u32 [%rd2+344], {%r13772, %r600}; | |
mov.u32 %r12399, %r13772; | |
mov.u32 %r13772, %r600; | |
mov.u32 %r13771, %r12399; | |
BB12_174: | |
mov.u32 %r603, %r13771; | |
mov.u32 %r602, %r13772; | |
setp.le.u32 %p90, %r13765, %r603; | |
mov.u32 %r13767, %r603; | |
mov.u32 %r13768, %r602; | |
@%p90 bra BB12_176; | |
st.local.v4.u32 [%rd2+336], {%r603, %r602, %r13765, %r13766}; | |
mov.u32 %r12396, %r13766; | |
mov.u32 %r12398, %r13765; | |
mov.u32 %r13766, %r602; | |
mov.u32 %r13765, %r603; | |
mov.u32 %r13767, %r12398; | |
mov.u32 %r13768, %r12396; | |
BB12_176: | |
mov.u32 %r607, %r13765; | |
mov.u32 %r606, %r13766; | |
mov.u32 %r605, %r13767; | |
mov.u32 %r604, %r13768; | |
setp.le.u32 %p91, %r13749, %r607; | |
mov.u32 %r13753, %r607; | |
mov.u32 %r13754, %r606; | |
mov.u32 %r13755, %r605; | |
mov.u32 %r13756, %r604; | |
@%p91 bra BB12_178; | |
st.local.v4.u32 [%rd2+320], {%r607, %r606, %r605, %r604}; | |
st.local.v4.u32 [%rd2+336], {%r13749, %r13750, %r13751, %r13752}; | |
mov.u32 %r12386, %r13752; | |
mov.u32 %r12388, %r13751; | |
mov.u32 %r12390, %r13750; | |
mov.u32 %r12392, %r13749; | |
mov.u32 %r13752, %r604; | |
mov.u32 %r13751, %r605; | |
mov.u32 %r13750, %r606; | |
mov.u32 %r13749, %r607; | |
mov.u32 %r13753, %r12392; | |
mov.u32 %r13754, %r12390; | |
mov.u32 %r13755, %r12388; | |
mov.u32 %r13756, %r12386; | |
BB12_178: | |
mov.u32 %r13733, %r13749; | |
mov.u32 %r13734, %r13750; | |
mov.u32 %r13735, %r13751; | |
mov.u32 %r13736, %r13752; | |
mov.u32 %r13737, %r13753; | |
mov.u32 %r13738, %r13754; | |
mov.u32 %r13739, %r13755; | |
mov.u32 %r13740, %r13756; | |
mul.lo.s64 %rd1073, %rd57, 1792; | |
add.s64 %rd1074, %rd6, %rd1073; | |
bfe.u32 %r5904, %r580, 22, 6; | |
mul.wide.u32 %rd1075, %r5904, 28; | |
add.s64 %rd1076, %rd1074, %rd1075; | |
ld.global.u32 %r616, [%rd1076+-8]; | |
and.b32 %r5905, %r616, 65535; | |
mul.wide.u32 %rd1077, %r5905, 1792; | |
add.s64 %rd1078, %rd4, %rd1077; | |
cvt.u64.u32 %rd61, %r5905; | |
bfe.u32 %r5906, %r616, 16, 6; | |
mul.wide.u32 %rd1079, %r5906, 28; | |
add.s64 %rd1080, %rd1078, %rd1079; | |
ld.global.u32 %r617, [%rd1080+-12]; | |
and.b32 %r5907, %r617, 65535; | |
cvt.u64.u32 %rd62, %r5907; | |
bfe.u32 %r5908, %r617, 16, 6; | |
mul.wide.u32 %rd1081, %r5907, 1792; | |
add.s64 %rd1082, %rd415, %rd1081; | |
mul.wide.u32 %rd1083, %r5908, 28; | |
add.s64 %rd1084, %rd1082, %rd1083; | |
ld.global.u32 %r5909, [%rd1084]; | |
and.b32 %r5910, %r5909, 65535; | |
bfe.u32 %r5911, %r5909, 16, 6; | |
mul.wide.u32 %rd1085, %r5910, 1792; | |
add.s64 %rd1086, %rd414, %rd1085; | |
mul.wide.u32 %rd1087, %r5911, 28; | |
add.s64 %rd1088, %rd1086, %rd1087; | |
ld.global.u32 %r5912, [%rd1088]; | |
and.b32 %r5913, %r5912, 65535; | |
shl.b32 %r5914, %r5913, 6; | |
bfe.u32 %r5915, %r5912, 16, 6; | |
or.b32 %r618, %r5914, %r5915; | |
st.local.u32 [%rd2+352], %r618; | |
bfe.u32 %r5916, %r5909, 22, 6; | |
mul.wide.u32 %rd1089, %r5916, 28; | |
add.s64 %rd1090, %rd1086, %rd1089; | |
ld.global.u32 %r5917, [%rd1090]; | |
and.b32 %r5918, %r5917, 65535; | |
shl.b32 %r5919, %r5918, 6; | |
bfe.u32 %r5920, %r5917, 16, 6; | |
or.b32 %r13786, %r5919, %r5920; | |
st.local.u32 [%rd2+356], %r13786; | |
setp.le.u32 %p92, %r618, %r13786; | |
mov.u32 %r13785, %r618; | |
@%p92 bra BB12_180; | |
st.local.v2.u32 [%rd2+352], {%r13786, %r618}; | |
mov.u32 %r12429, %r13786; | |
mov.u32 %r13786, %r618; | |
mov.u32 %r13785, %r12429; | |
BB12_180: | |
mov.u32 %r13781, %r13785; | |
mov.u32 %r13782, %r13786; | |
bfe.u32 %r5921, %r617, 22, 6; | |
mul.lo.s64 %rd1091, %rd62, 1792; | |
add.s64 %rd1092, %rd415, %rd1091; | |
mul.wide.u32 %rd1093, %r5921, 28; | |
add.s64 %rd1094, %rd1092, %rd1093; | |
ld.global.u32 %r5922, [%rd1094]; | |
and.b32 %r5923, %r5922, 65535; | |
bfe.u32 %r5924, %r5922, 16, 6; | |
mul.wide.u32 %rd1095, %r5923, 1792; | |
add.s64 %rd1096, %rd414, %rd1095; | |
mul.wide.u32 %rd1097, %r5924, 28; | |
add.s64 %rd1098, %rd1096, %rd1097; | |
ld.global.u32 %r5925, [%rd1098]; | |
and.b32 %r5926, %r5925, 65535; | |
shl.b32 %r5927, %r5926, 6; | |
bfe.u32 %r5928, %r5925, 16, 6; | |
or.b32 %r622, %r5927, %r5928; | |
st.local.u32 [%rd2+360], %r622; | |
bfe.u32 %r5929, %r5922, 22, 6; | |
mul.wide.u32 %rd1099, %r5929, 28; | |
add.s64 %rd1100, %rd1096, %rd1099; | |
ld.global.u32 %r5930, [%rd1100]; | |
and.b32 %r5931, %r5930, 65535; | |
shl.b32 %r5932, %r5931, 6; | |
bfe.u32 %r5933, %r5930, 16, 6; | |
or.b32 %r13788, %r5932, %r5933; | |
st.local.u32 [%rd2+364], %r13788; | |
setp.le.u32 %p93, %r622, %r13788; | |
mov.u32 %r13787, %r622; | |
@%p93 bra BB12_182; | |
st.local.v2.u32 [%rd2+360], {%r13788, %r622}; | |
mov.u32 %r12435, %r13788; | |
mov.u32 %r13788, %r622; | |
mov.u32 %r13787, %r12435; | |
BB12_182: | |
mov.u32 %r625, %r13787; | |
mov.u32 %r624, %r13788; | |
setp.le.u32 %p94, %r13781, %r625; | |
mov.u32 %r13783, %r625; | |
mov.u32 %r13784, %r624; | |
@%p94 bra BB12_184; | |
st.local.v4.u32 [%rd2+352], {%r625, %r624, %r13781, %r13782}; | |
mov.u32 %r12432, %r13782; | |
mov.u32 %r12434, %r13781; | |
mov.u32 %r13782, %r624; | |
mov.u32 %r13781, %r625; | |
mov.u32 %r13783, %r12434; | |
mov.u32 %r13784, %r12432; | |
BB12_184: | |
mov.u32 %r13773, %r13781; | |
mov.u32 %r13774, %r13782; | |
mov.u32 %r13775, %r13783; | |
mov.u32 %r13776, %r13784; | |
mul.lo.s64 %rd1101, %rd61, 1792; | |
add.s64 %rd1102, %rd4, %rd1101; | |
bfe.u32 %r5934, %r616, 22, 6; | |
mul.wide.u32 %rd1103, %r5934, 28; | |
add.s64 %rd1104, %rd1102, %rd1103; | |
ld.global.u32 %r630, [%rd1104+-12]; | |
and.b32 %r5935, %r630, 65535; | |
cvt.u64.u32 %rd63, %r5935; | |
bfe.u32 %r5936, %r630, 16, 6; | |
mul.wide.u32 %rd1105, %r5935, 1792; | |
add.s64 %rd1106, %rd415, %rd1105; | |
mul.wide.u32 %rd1107, %r5936, 28; | |
add.s64 %rd1108, %rd1106, %rd1107; | |
ld.global.u32 %r5937, [%rd1108]; | |
and.b32 %r5938, %r5937, 65535; | |
bfe.u32 %r5939, %r5937, 16, 6; | |
mul.wide.u32 %rd1109, %r5938, 1792; | |
add.s64 %rd1110, %rd414, %rd1109; | |
mul.wide.u32 %rd1111, %r5939, 28; | |
add.s64 %rd1112, %rd1110, %rd1111; | |
ld.global.u32 %r5940, [%rd1112]; | |
and.b32 %r5941, %r5940, 65535; | |
shl.b32 %r5942, %r5941, 6; | |
bfe.u32 %r5943, %r5940, 16, 6; | |
or.b32 %r631, %r5942, %r5943; | |
st.local.u32 [%rd2+368], %r631; | |
bfe.u32 %r5944, %r5937, 22, 6; | |
mul.wide.u32 %rd1113, %r5944, 28; | |
add.s64 %rd1114, %rd1110, %rd1113; | |
ld.global.u32 %r5945, [%rd1114]; | |
and.b32 %r5946, %r5945, 65535; | |
shl.b32 %r5947, %r5946, 6; | |
bfe.u32 %r5948, %r5945, 16, 6; | |
or.b32 %r13794, %r5947, %r5948; | |
st.local.u32 [%rd2+372], %r13794; | |
setp.le.u32 %p95, %r631, %r13794; | |
mov.u32 %r13793, %r631; | |
@%p95 bra BB12_186; | |
st.local.v2.u32 [%rd2+368], {%r13794, %r631}; | |
mov.u32 %r12449, %r13794; | |
mov.u32 %r13794, %r631; | |
mov.u32 %r13793, %r12449; | |
BB12_186: | |
mov.u32 %r13789, %r13793; | |
mov.u32 %r13790, %r13794; | |
bfe.u32 %r5949, %r630, 22, 6; | |
mul.lo.s64 %rd1115, %rd63, 1792; | |
add.s64 %rd1116, %rd415, %rd1115; | |
mul.wide.u32 %rd1117, %r5949, 28; | |
add.s64 %rd1118, %rd1116, %rd1117; | |
ld.global.u32 %r5950, [%rd1118]; | |
and.b32 %r5951, %r5950, 65535; | |
bfe.u32 %r5952, %r5950, 16, 6; | |
mul.wide.u32 %rd1119, %r5951, 1792; | |
add.s64 %rd1120, %rd414, %rd1119; | |
mul.wide.u32 %rd1121, %r5952, 28; | |
add.s64 %rd1122, %rd1120, %rd1121; | |
ld.global.u32 %r5953, [%rd1122]; | |
and.b32 %r5954, %r5953, 65535; | |
shl.b32 %r5955, %r5954, 6; | |
bfe.u32 %r5956, %r5953, 16, 6; | |
or.b32 %r635, %r5955, %r5956; | |
st.local.u32 [%rd2+376], %r635; | |
bfe.u32 %r5957, %r5950, 22, 6; | |
mul.wide.u32 %rd1123, %r5957, 28; | |
add.s64 %rd1124, %rd1120, %rd1123; | |
ld.global.u32 %r5958, [%rd1124]; | |
and.b32 %r5959, %r5958, 65535; | |
shl.b32 %r5960, %r5959, 6; | |
bfe.u32 %r5961, %r5958, 16, 6; | |
or.b32 %r13796, %r5960, %r5961; | |
st.local.u32 [%rd2+380], %r13796; | |
setp.le.u32 %p96, %r635, %r13796; | |
mov.u32 %r13795, %r635; | |
@%p96 bra BB12_188; | |
st.local.v2.u32 [%rd2+376], {%r13796, %r635}; | |
mov.u32 %r12455, %r13796; | |
mov.u32 %r13796, %r635; | |
mov.u32 %r13795, %r12455; | |
BB12_188: | |
mov.u32 %r638, %r13795; | |
mov.u32 %r637, %r13796; | |
setp.le.u32 %p97, %r13789, %r638; | |
mov.u32 %r13791, %r638; | |
mov.u32 %r13792, %r637; | |
@%p97 bra BB12_190; | |
st.local.v4.u32 [%rd2+368], {%r638, %r637, %r13789, %r13790}; | |
mov.u32 %r12452, %r13790; | |
mov.u32 %r12454, %r13789; | |
mov.u32 %r13790, %r637; | |
mov.u32 %r13789, %r638; | |
mov.u32 %r13791, %r12454; | |
mov.u32 %r13792, %r12452; | |
BB12_190: | |
mov.u32 %r642, %r13789; | |
mov.u32 %r641, %r13790; | |
mov.u32 %r640, %r13791; | |
mov.u32 %r639, %r13792; | |
setp.le.u32 %p98, %r13773, %r642; | |
mov.u32 %r13777, %r642; | |
mov.u32 %r13778, %r641; | |
mov.u32 %r13779, %r640; | |
mov.u32 %r13780, %r639; | |
@%p98 bra BB12_192; | |
st.local.v4.u32 [%rd2+352], {%r642, %r641, %r640, %r639}; | |
st.local.v4.u32 [%rd2+368], {%r13773, %r13774, %r13775, %r13776}; | |
mov.u32 %r12442, %r13776; | |
mov.u32 %r12444, %r13775; | |
mov.u32 %r12446, %r13774; | |
mov.u32 %r12448, %r13773; | |
mov.u32 %r13776, %r639; | |
mov.u32 %r13775, %r640; | |
mov.u32 %r13774, %r641; | |
mov.u32 %r13773, %r642; | |
mov.u32 %r13777, %r12448; | |
mov.u32 %r13778, %r12446; | |
mov.u32 %r13779, %r12444; | |
mov.u32 %r13780, %r12442; | |
BB12_192: | |
mov.u32 %r650, %r13773; | |
mov.u32 %r649, %r13774; | |
mov.u32 %r648, %r13775; | |
mov.u32 %r647, %r13776; | |
mov.u32 %r646, %r13777; | |
mov.u32 %r645, %r13778; | |
mov.u32 %r644, %r13779; | |
mov.u32 %r643, %r13780; | |
setp.le.u32 %p99, %r13733, %r650; | |
mov.u32 %r13741, %r650; | |
mov.u32 %r13742, %r649; | |
mov.u32 %r13743, %r648; | |
mov.u32 %r13744, %r647; | |
mov.u32 %r13745, %r646; | |
mov.u32 %r13746, %r645; | |
mov.u32 %r13747, %r644; | |
mov.u32 %r13748, %r643; | |
@%p99 bra BB12_194; | |
st.local.v4.u32 [%rd2+320], {%r650, %r649, %r648, %r647}; | |
st.local.v4.u32 [%rd2+352], {%r13733, %r13734, %r13735, %r13736}; | |
st.local.v4.u32 [%rd2+336], {%r646, %r645, %r644, %r643}; | |
st.local.v4.u32 [%rd2+368], {%r13737, %r13738, %r13739, %r13740}; | |
mov.u32 %r12414, %r13740; | |
mov.u32 %r12416, %r13739; | |
mov.u32 %r12418, %r13738; | |
mov.u32 %r12420, %r13737; | |
mov.u32 %r12422, %r13736; | |
mov.u32 %r12424, %r13735; | |
mov.u32 %r12426, %r13734; | |
mov.u32 %r12428, %r13733; | |
mov.u32 %r13740, %r643; | |
mov.u32 %r13739, %r644; | |
mov.u32 %r13738, %r645; | |
mov.u32 %r13737, %r646; | |
mov.u32 %r13736, %r647; | |
mov.u32 %r13735, %r648; | |
mov.u32 %r13734, %r649; | |
mov.u32 %r13733, %r650; | |
mov.u32 %r13741, %r12428; | |
mov.u32 %r13742, %r12426; | |
mov.u32 %r13743, %r12424; | |
mov.u32 %r13744, %r12422; | |
mov.u32 %r13745, %r12420; | |
mov.u32 %r13746, %r12418; | |
mov.u32 %r13747, %r12416; | |
mov.u32 %r13748, %r12414; | |
BB12_194: | |
mov.u32 %r666, %r13733; | |
mov.u32 %r665, %r13734; | |
mov.u32 %r664, %r13735; | |
mov.u32 %r663, %r13736; | |
mov.u32 %r662, %r13737; | |
mov.u32 %r661, %r13738; | |
mov.u32 %r660, %r13739; | |
mov.u32 %r659, %r13740; | |
mov.u32 %r658, %r13741; | |
mov.u32 %r657, %r13742; | |
mov.u32 %r656, %r13743; | |
mov.u32 %r655, %r13744; | |
mov.u32 %r654, %r13745; | |
mov.u32 %r653, %r13746; | |
mov.u32 %r652, %r13747; | |
mov.u32 %r651, %r13748; | |
setp.le.u32 %p100, %r13637, %r666; | |
mov.u32 %r13653, %r666; | |
mov.u32 %r13654, %r665; | |
mov.u32 %r13655, %r664; | |
mov.u32 %r13656, %r663; | |
mov.u32 %r13657, %r662; | |
mov.u32 %r13658, %r661; | |
mov.u32 %r13659, %r660; | |
mov.u32 %r13660, %r659; | |
mov.u32 %r13661, %r658; | |
mov.u32 %r13662, %r657; | |
mov.u32 %r13663, %r656; | |
mov.u32 %r13664, %r655; | |
mov.u32 %r13665, %r654; | |
mov.u32 %r13666, %r653; | |
mov.u32 %r13667, %r652; | |
mov.u32 %r13668, %r651; | |
@%p100 bra BB12_196; | |
st.local.v4.u32 [%rd2+256], {%r666, %r665, %r664, %r663}; | |
st.local.v4.u32 [%rd2+320], {%r13637, %r13638, %r13639, %r13640}; | |
st.local.v4.u32 [%rd2+272], {%r662, %r661, %r660, %r659}; | |
st.local.v4.u32 [%rd2+336], {%r13641, %r13642, %r13643, %r13644}; | |
st.local.v4.u32 [%rd2+288], {%r658, %r657, %r656, %r655}; | |
st.local.v4.u32 [%rd2+352], {%r13645, %r13646, %r13647, %r13648}; | |
st.local.v4.u32 [%rd2+304], {%r654, %r653, %r652, %r651}; | |
st.local.v4.u32 [%rd2+368], {%r13649, %r13650, %r13651, %r13652}; | |
mov.u32 %r12342, %r13652; | |
mov.u32 %r12344, %r13651; | |
mov.u32 %r12346, %r13650; | |
mov.u32 %r12348, %r13649; | |
mov.u32 %r12350, %r13648; | |
mov.u32 %r12352, %r13647; | |
mov.u32 %r12354, %r13646; | |
mov.u32 %r12356, %r13645; | |
mov.u32 %r12358, %r13644; | |
mov.u32 %r12360, %r13643; | |
mov.u32 %r12362, %r13642; | |
mov.u32 %r12364, %r13641; | |
mov.u32 %r12366, %r13640; | |
mov.u32 %r12368, %r13639; | |
mov.u32 %r12370, %r13638; | |
mov.u32 %r12372, %r13637; | |
mov.u32 %r13652, %r651; | |
mov.u32 %r13651, %r652; | |
mov.u32 %r13650, %r653; | |
mov.u32 %r13649, %r654; | |
mov.u32 %r13648, %r655; | |
mov.u32 %r13647, %r656; | |
mov.u32 %r13646, %r657; | |
mov.u32 %r13645, %r658; | |
mov.u32 %r13644, %r659; | |
mov.u32 %r13643, %r660; | |
mov.u32 %r13642, %r661; | |
mov.u32 %r13641, %r662; | |
mov.u32 %r13640, %r663; | |
mov.u32 %r13639, %r664; | |
mov.u32 %r13638, %r665; | |
mov.u32 %r13637, %r666; | |
mov.u32 %r13653, %r12372; | |
mov.u32 %r13654, %r12370; | |
mov.u32 %r13655, %r12368; | |
mov.u32 %r13656, %r12366; | |
mov.u32 %r13657, %r12364; | |
mov.u32 %r13658, %r12362; | |
mov.u32 %r13659, %r12360; | |
mov.u32 %r13660, %r12358; | |
mov.u32 %r13661, %r12356; | |
mov.u32 %r13662, %r12354; | |
mov.u32 %r13663, %r12352; | |
mov.u32 %r13664, %r12350; | |
mov.u32 %r13665, %r12348; | |
mov.u32 %r13666, %r12346; | |
mov.u32 %r13667, %r12344; | |
mov.u32 %r13668, %r12342; | |
BB12_196: | |
mov.u32 %r13573, %r13637; | |
mov.u32 %r13574, %r13638; | |
mov.u32 %r13575, %r13639; | |
mov.u32 %r13576, %r13640; | |
mov.u32 %r13577, %r13641; | |
mov.u32 %r13578, %r13642; | |
mov.u32 %r13579, %r13643; | |
mov.u32 %r13580, %r13644; | |
mov.u32 %r13581, %r13645; | |
mov.u32 %r13582, %r13646; | |
mov.u32 %r13583, %r13647; | |
mov.u32 %r13584, %r13648; | |
mov.u32 %r13585, %r13649; | |
mov.u32 %r13586, %r13650; | |
mov.u32 %r13587, %r13651; | |
mov.u32 %r13588, %r13652; | |
mov.u32 %r13589, %r13653; | |
mov.u32 %r13590, %r13654; | |
mov.u32 %r13591, %r13655; | |
mov.u32 %r13592, %r13656; | |
mov.u32 %r13593, %r13657; | |
mov.u32 %r13594, %r13658; | |
mov.u32 %r13595, %r13659; | |
mov.u32 %r13596, %r13660; | |
mov.u32 %r13597, %r13661; | |
mov.u32 %r13598, %r13662; | |
mov.u32 %r13599, %r13663; | |
mov.u32 %r13600, %r13664; | |
mov.u32 %r13601, %r13665; | |
mov.u32 %r13602, %r13666; | |
mov.u32 %r13603, %r13667; | |
mov.u32 %r13604, %r13668; | |
mul.lo.s64 %rd1125, %rd48, 1792; | |
add.s64 %rd1126, %rd6, %rd1125; | |
bfe.u32 %r5962, %r491, 22, 6; | |
mul.wide.u32 %rd1127, %r5962, 28; | |
add.s64 %rd1128, %rd1126, %rd1127; | |
ld.global.u32 %r699, [%rd1128+-4]; | |
and.b32 %r5963, %r699, 65535; | |
mul.wide.u32 %rd1129, %r5963, 1792; | |
add.s64 %rd1130, %rd4, %rd1129; | |
bfe.u32 %r5964, %r699, 16, 6; | |
mul.wide.u32 %rd1131, %r5964, 28; | |
add.s64 %rd1132, %rd1130, %rd1131; | |
ld.global.u32 %r700, [%rd1132+-8]; | |
and.b32 %r5965, %r700, 65535; | |
mul.wide.u32 %rd1133, %r5965, 1792; | |
add.s64 %rd1134, %rd6, %rd1133; | |
bfe.u32 %r5966, %r700, 16, 6; | |
mul.wide.u32 %rd1135, %r5966, 28; | |
add.s64 %rd1136, %rd1134, %rd1135; | |
ld.global.u32 %r701, [%rd1136+-8]; | |
and.b32 %r5967, %r701, 65535; | |
mul.wide.u32 %rd1137, %r5967, 1792; | |
add.s64 %rd1138, %rd4, %rd1137; | |
cvt.u64.u32 %rd64, %r5963; | |
cvt.u64.u32 %rd65, %r5965; | |
cvt.u64.u32 %rd66, %r5967; | |
bfe.u32 %r5968, %r701, 16, 6; | |
mul.wide.u32 %rd1139, %r5968, 28; | |
add.s64 %rd1140, %rd1138, %rd1139; | |
ld.global.u32 %r702, [%rd1140+-12]; | |
and.b32 %r5969, %r702, 65535; | |
cvt.u64.u32 %rd67, %r5969; | |
bfe.u32 %r5970, %r702, 16, 6; | |
mul.wide.u32 %rd1141, %r5969, 1792; | |
add.s64 %rd1142, %rd415, %rd1141; | |
mul.wide.u32 %rd1143, %r5970, 28; | |
add.s64 %rd1144, %rd1142, %rd1143; | |
ld.global.u32 %r5971, [%rd1144]; | |
and.b32 %r5972, %r5971, 65535; | |
bfe.u32 %r5973, %r5971, 16, 6; | |
mul.wide.u32 %rd1145, %r5972, 1792; | |
add.s64 %rd1146, %rd414, %rd1145; | |
mul.wide.u32 %rd1147, %r5973, 28; | |
add.s64 %rd1148, %rd1146, %rd1147; | |
ld.global.u32 %r5974, [%rd1148]; | |
and.b32 %r5975, %r5974, 65535; | |
shl.b32 %r5976, %r5975, 6; | |
bfe.u32 %r5977, %r5974, 16, 6; | |
or.b32 %r703, %r5976, %r5977; | |
st.local.u32 [%rd2+384], %r703; | |
bfe.u32 %r5978, %r5971, 22, 6; | |
mul.wide.u32 %rd1149, %r5978, 28; | |
add.s64 %rd1150, %rd1146, %rd1149; | |
ld.global.u32 %r5979, [%rd1150]; | |
and.b32 %r5980, %r5979, 65535; | |
shl.b32 %r5981, %r5980, 6; | |
bfe.u32 %r5982, %r5979, 16, 6; | |
or.b32 %r13858, %r5981, %r5982; | |
st.local.u32 [%rd2+388], %r13858; | |
setp.le.u32 %p101, %r703, %r13858; | |
mov.u32 %r13857, %r703; | |
@%p101 bra BB12_198; | |
st.local.v2.u32 [%rd2+384], {%r13858, %r703}; | |
mov.u32 %r12581, %r13858; | |
mov.u32 %r13858, %r703; | |
mov.u32 %r13857, %r12581; | |
BB12_198: | |
mov.u32 %r13853, %r13857; | |
mov.u32 %r13854, %r13858; | |
bfe.u32 %r5983, %r702, 22, 6; | |
mul.lo.s64 %rd1151, %rd67, 1792; | |
add.s64 %rd1152, %rd415, %rd1151; | |
mul.wide.u32 %rd1153, %r5983, 28; | |
add.s64 %rd1154, %rd1152, %rd1153; | |
ld.global.u32 %r5984, [%rd1154]; | |
and.b32 %r5985, %r5984, 65535; | |
bfe.u32 %r5986, %r5984, 16, 6; | |
mul.wide.u32 %rd1155, %r5985, 1792; | |
add.s64 %rd1156, %rd414, %rd1155; | |
mul.wide.u32 %rd1157, %r5986, 28; | |
add.s64 %rd1158, %rd1156, %rd1157; | |
ld.global.u32 %r5987, [%rd1158]; | |
and.b32 %r5988, %r5987, 65535; | |
shl.b32 %r5989, %r5988, 6; | |
bfe.u32 %r5990, %r5987, 16, 6; | |
or.b32 %r707, %r5989, %r5990; | |
st.local.u32 [%rd2+392], %r707; | |
bfe.u32 %r5991, %r5984, 22, 6; | |
mul.wide.u32 %rd1159, %r5991, 28; | |
add.s64 %rd1160, %rd1156, %rd1159; | |
ld.global.u32 %r5992, [%rd1160]; | |
and.b32 %r5993, %r5992, 65535; | |
shl.b32 %r5994, %r5993, 6; | |
bfe.u32 %r5995, %r5992, 16, 6; | |
or.b32 %r13860, %r5994, %r5995; | |
st.local.u32 [%rd2+396], %r13860; | |
setp.le.u32 %p102, %r707, %r13860; | |
mov.u32 %r13859, %r707; | |
@%p102 bra BB12_200; | |
st.local.v2.u32 [%rd2+392], {%r13860, %r707}; | |
mov.u32 %r12587, %r13860; | |
mov.u32 %r13860, %r707; | |
mov.u32 %r13859, %r12587; | |
BB12_200: | |
mov.u32 %r710, %r13859; | |
mov.u32 %r709, %r13860; | |
setp.le.u32 %p103, %r13853, %r710; | |
mov.u32 %r13855, %r710; | |
mov.u32 %r13856, %r709; | |
@%p103 bra BB12_202; | |
st.local.v4.u32 [%rd2+384], {%r710, %r709, %r13853, %r13854}; | |
mov.u32 %r12584, %r13854; | |
mov.u32 %r12586, %r13853; | |
mov.u32 %r13854, %r709; | |
mov.u32 %r13853, %r710; | |
mov.u32 %r13855, %r12586; | |
mov.u32 %r13856, %r12584; | |
BB12_202: | |
mov.u32 %r13845, %r13853; | |
mov.u32 %r13846, %r13854; | |
mov.u32 %r13847, %r13855; | |
mov.u32 %r13848, %r13856; | |
mul.lo.s64 %rd1161, %rd66, 1792; | |
add.s64 %rd1162, %rd4, %rd1161; | |
bfe.u32 %r5996, %r701, 22, 6; | |
mul.wide.u32 %rd1163, %r5996, 28; | |
add.s64 %rd1164, %rd1162, %rd1163; | |
ld.global.u32 %r715, [%rd1164+-12]; | |
and.b32 %r5997, %r715, 65535; | |
cvt.u64.u32 %rd68, %r5997; | |
bfe.u32 %r5998, %r715, 16, 6; | |
mul.wide.u32 %rd1165, %r5997, 1792; | |
add.s64 %rd1166, %rd415, %rd1165; | |
mul.wide.u32 %rd1167, %r5998, 28; | |
add.s64 %rd1168, %rd1166, %rd1167; | |
ld.global.u32 %r5999, [%rd1168]; | |
and.b32 %r6000, %r5999, 65535; | |
bfe.u32 %r6001, %r5999, 16, 6; | |
mul.wide.u32 %rd1169, %r6000, 1792; | |
add.s64 %rd1170, %rd414, %rd1169; | |
mul.wide.u32 %rd1171, %r6001, 28; | |
add.s64 %rd1172, %rd1170, %rd1171; | |
ld.global.u32 %r6002, [%rd1172]; | |
and.b32 %r6003, %r6002, 65535; | |
shl.b32 %r6004, %r6003, 6; | |
bfe.u32 %r6005, %r6002, 16, 6; | |
or.b32 %r716, %r6004, %r6005; | |
st.local.u32 [%rd2+400], %r716; | |
bfe.u32 %r6006, %r5999, 22, 6; | |
mul.wide.u32 %rd1173, %r6006, 28; | |
add.s64 %rd1174, %rd1170, %rd1173; | |
ld.global.u32 %r6007, [%rd1174]; | |
and.b32 %r6008, %r6007, 65535; | |
shl.b32 %r6009, %r6008, 6; | |
bfe.u32 %r6010, %r6007, 16, 6; | |
or.b32 %r13866, %r6009, %r6010; | |
st.local.u32 [%rd2+404], %r13866; | |
setp.le.u32 %p104, %r716, %r13866; | |
mov.u32 %r13865, %r716; | |
@%p104 bra BB12_204; | |
st.local.v2.u32 [%rd2+400], {%r13866, %r716}; | |
mov.u32 %r12601, %r13866; | |
mov.u32 %r13866, %r716; | |
mov.u32 %r13865, %r12601; | |
BB12_204: | |
mov.u32 %r13861, %r13865; | |
mov.u32 %r13862, %r13866; | |
bfe.u32 %r6011, %r715, 22, 6; | |
mul.lo.s64 %rd1175, %rd68, 1792; | |
add.s64 %rd1176, %rd415, %rd1175; | |
mul.wide.u32 %rd1177, %r6011, 28; | |
add.s64 %rd1178, %rd1176, %rd1177; | |
ld.global.u32 %r6012, [%rd1178]; | |
and.b32 %r6013, %r6012, 65535; | |
bfe.u32 %r6014, %r6012, 16, 6; | |
mul.wide.u32 %rd1179, %r6013, 1792; | |
add.s64 %rd1180, %rd414, %rd1179; | |
mul.wide.u32 %rd1181, %r6014, 28; | |
add.s64 %rd1182, %rd1180, %rd1181; | |
ld.global.u32 %r6015, [%rd1182]; | |
and.b32 %r6016, %r6015, 65535; | |
shl.b32 %r6017, %r6016, 6; | |
bfe.u32 %r6018, %r6015, 16, 6; | |
or.b32 %r720, %r6017, %r6018; | |
st.local.u32 [%rd2+408], %r720; | |
bfe.u32 %r6019, %r6012, 22, 6; | |
mul.wide.u32 %rd1183, %r6019, 28; | |
add.s64 %rd1184, %rd1180, %rd1183; | |
ld.global.u32 %r6020, [%rd1184]; | |
and.b32 %r6021, %r6020, 65535; | |
shl.b32 %r6022, %r6021, 6; | |
bfe.u32 %r6023, %r6020, 16, 6; | |
or.b32 %r13868, %r6022, %r6023; | |
st.local.u32 [%rd2+412], %r13868; | |
setp.le.u32 %p105, %r720, %r13868; | |
mov.u32 %r13867, %r720; | |
@%p105 bra BB12_206; | |
st.local.v2.u32 [%rd2+408], {%r13868, %r720}; | |
mov.u32 %r12607, %r13868; | |
mov.u32 %r13868, %r720; | |
mov.u32 %r13867, %r12607; | |
BB12_206: | |
mov.u32 %r723, %r13867; | |
mov.u32 %r722, %r13868; | |
setp.le.u32 %p106, %r13861, %r723; | |
mov.u32 %r13863, %r723; | |
mov.u32 %r13864, %r722; | |
@%p106 bra BB12_208; | |
st.local.v4.u32 [%rd2+400], {%r723, %r722, %r13861, %r13862}; | |
mov.u32 %r12604, %r13862; | |
mov.u32 %r12606, %r13861; | |
mov.u32 %r13862, %r722; | |
mov.u32 %r13861, %r723; | |
mov.u32 %r13863, %r12606; | |
mov.u32 %r13864, %r12604; | |
BB12_208: | |
mov.u32 %r727, %r13861; | |
mov.u32 %r726, %r13862; | |
mov.u32 %r725, %r13863; | |
mov.u32 %r724, %r13864; | |
setp.le.u32 %p107, %r13845, %r727; | |
mov.u32 %r13849, %r727; | |
mov.u32 %r13850, %r726; | |
mov.u32 %r13851, %r725; | |
mov.u32 %r13852, %r724; | |
@%p107 bra BB12_210; | |
st.local.v4.u32 [%rd2+384], {%r727, %r726, %r725, %r724}; | |
st.local.v4.u32 [%rd2+400], {%r13845, %r13846, %r13847, %r13848}; | |
mov.u32 %r12594, %r13848; | |
mov.u32 %r12596, %r13847; | |
mov.u32 %r12598, %r13846; | |
mov.u32 %r12600, %r13845; | |
mov.u32 %r13848, %r724; | |
mov.u32 %r13847, %r725; | |
mov.u32 %r13846, %r726; | |
mov.u32 %r13845, %r727; | |
mov.u32 %r13849, %r12600; | |
mov.u32 %r13850, %r12598; | |
mov.u32 %r13851, %r12596; | |
mov.u32 %r13852, %r12594; | |
BB12_210: | |
mov.u32 %r13829, %r13845; | |
mov.u32 %r13830, %r13846; | |
mov.u32 %r13831, %r13847; | |
mov.u32 %r13832, %r13848; | |
mov.u32 %r13833, %r13849; | |
mov.u32 %r13834, %r13850; | |
mov.u32 %r13835, %r13851; | |
mov.u32 %r13836, %r13852; | |
mul.lo.s64 %rd1185, %rd65, 1792; | |
add.s64 %rd1186, %rd6, %rd1185; | |
bfe.u32 %r6024, %r700, 22, 6; | |
mul.wide.u32 %rd1187, %r6024, 28; | |
add.s64 %rd1188, %rd1186, %rd1187; | |
ld.global.u32 %r736, [%rd1188+-8]; | |
and.b32 %r6025, %r736, 65535; | |
mul.wide.u32 %rd1189, %r6025, 1792; | |
add.s64 %rd1190, %rd4, %rd1189; | |
cvt.u64.u32 %rd69, %r6025; | |
bfe.u32 %r6026, %r736, 16, 6; | |
mul.wide.u32 %rd1191, %r6026, 28; | |
add.s64 %rd1192, %rd1190, %rd1191; | |
ld.global.u32 %r737, [%rd1192+-12]; | |
and.b32 %r6027, %r737, 65535; | |
cvt.u64.u32 %rd70, %r6027; | |
bfe.u32 %r6028, %r737, 16, 6; | |
mul.wide.u32 %rd1193, %r6027, 1792; | |
add.s64 %rd1194, %rd415, %rd1193; | |
mul.wide.u32 %rd1195, %r6028, 28; | |
add.s64 %rd1196, %rd1194, %rd1195; | |
ld.global.u32 %r6029, [%rd1196]; | |
and.b32 %r6030, %r6029, 65535; | |
bfe.u32 %r6031, %r6029, 16, 6; | |
mul.wide.u32 %rd1197, %r6030, 1792; | |
add.s64 %rd1198, %rd414, %rd1197; | |
mul.wide.u32 %rd1199, %r6031, 28; | |
add.s64 %rd1200, %rd1198, %rd1199; | |
ld.global.u32 %r6032, [%rd1200]; | |
and.b32 %r6033, %r6032, 65535; | |
shl.b32 %r6034, %r6033, 6; | |
bfe.u32 %r6035, %r6032, 16, 6; | |
or.b32 %r738, %r6034, %r6035; | |
st.local.u32 [%rd2+416], %r738; | |
bfe.u32 %r6036, %r6029, 22, 6; | |
mul.wide.u32 %rd1201, %r6036, 28; | |
add.s64 %rd1202, %rd1198, %rd1201; | |
ld.global.u32 %r6037, [%rd1202]; | |
and.b32 %r6038, %r6037, 65535; | |
shl.b32 %r6039, %r6038, 6; | |
bfe.u32 %r6040, %r6037, 16, 6; | |
or.b32 %r13882, %r6039, %r6040; | |
st.local.u32 [%rd2+420], %r13882; | |
setp.le.u32 %p108, %r738, %r13882; | |
mov.u32 %r13881, %r738; | |
@%p108 bra BB12_212; | |
st.local.v2.u32 [%rd2+416], {%r13882, %r738}; | |
mov.u32 %r12637, %r13882; | |
mov.u32 %r13882, %r738; | |
mov.u32 %r13881, %r12637; | |
BB12_212: | |
mov.u32 %r13877, %r13881; | |
mov.u32 %r13878, %r13882; | |
bfe.u32 %r6041, %r737, 22, 6; | |
mul.lo.s64 %rd1203, %rd70, 1792; | |
add.s64 %rd1204, %rd415, %rd1203; | |
mul.wide.u32 %rd1205, %r6041, 28; | |
add.s64 %rd1206, %rd1204, %rd1205; | |
ld.global.u32 %r6042, [%rd1206]; | |
and.b32 %r6043, %r6042, 65535; | |
bfe.u32 %r6044, %r6042, 16, 6; | |
mul.wide.u32 %rd1207, %r6043, 1792; | |
add.s64 %rd1208, %rd414, %rd1207; | |
mul.wide.u32 %rd1209, %r6044, 28; | |
add.s64 %rd1210, %rd1208, %rd1209; | |
ld.global.u32 %r6045, [%rd1210]; | |
and.b32 %r6046, %r6045, 65535; | |
shl.b32 %r6047, %r6046, 6; | |
bfe.u32 %r6048, %r6045, 16, 6; | |
or.b32 %r742, %r6047, %r6048; | |
st.local.u32 [%rd2+424], %r742; | |
bfe.u32 %r6049, %r6042, 22, 6; | |
mul.wide.u32 %rd1211, %r6049, 28; | |
add.s64 %rd1212, %rd1208, %rd1211; | |
ld.global.u32 %r6050, [%rd1212]; | |
and.b32 %r6051, %r6050, 65535; | |
shl.b32 %r6052, %r6051, 6; | |
bfe.u32 %r6053, %r6050, 16, 6; | |
or.b32 %r13884, %r6052, %r6053; | |
st.local.u32 [%rd2+428], %r13884; | |
setp.le.u32 %p109, %r742, %r13884; | |
mov.u32 %r13883, %r742; | |
@%p109 bra BB12_214; | |
st.local.v2.u32 [%rd2+424], {%r13884, %r742}; | |
mov.u32 %r12643, %r13884; | |
mov.u32 %r13884, %r742; | |
mov.u32 %r13883, %r12643; | |
BB12_214: | |
mov.u32 %r745, %r13883; | |
mov.u32 %r744, %r13884; | |
setp.le.u32 %p110, %r13877, %r745; | |
mov.u32 %r13879, %r745; | |
mov.u32 %r13880, %r744; | |
@%p110 bra BB12_216; | |
st.local.v4.u32 [%rd2+416], {%r745, %r744, %r13877, %r13878}; | |
mov.u32 %r12640, %r13878; | |
mov.u32 %r12642, %r13877; | |
mov.u32 %r13878, %r744; | |
mov.u32 %r13877, %r745; | |
mov.u32 %r13879, %r12642; | |
mov.u32 %r13880, %r12640; | |
BB12_216: | |
mov.u32 %r13869, %r13877; | |
mov.u32 %r13870, %r13878; | |
mov.u32 %r13871, %r13879; | |
mov.u32 %r13872, %r13880; | |
mul.lo.s64 %rd1213, %rd69, 1792; | |
add.s64 %rd1214, %rd4, %rd1213; | |
bfe.u32 %r6054, %r736, 22, 6; | |
mul.wide.u32 %rd1215, %r6054, 28; | |
add.s64 %rd1216, %rd1214, %rd1215; | |
ld.global.u32 %r750, [%rd1216+-12]; | |
and.b32 %r6055, %r750, 65535; | |
cvt.u64.u32 %rd71, %r6055; | |
bfe.u32 %r6056, %r750, 16, 6; | |
mul.wide.u32 %rd1217, %r6055, 1792; | |
add.s64 %rd1218, %rd415, %rd1217; | |
mul.wide.u32 %rd1219, %r6056, 28; | |
add.s64 %rd1220, %rd1218, %rd1219; | |
ld.global.u32 %r6057, [%rd1220]; | |
and.b32 %r6058, %r6057, 65535; | |
bfe.u32 %r6059, %r6057, 16, 6; | |
mul.wide.u32 %rd1221, %r6058, 1792; | |
add.s64 %rd1222, %rd414, %rd1221; | |
mul.wide.u32 %rd1223, %r6059, 28; | |
add.s64 %rd1224, %rd1222, %rd1223; | |
ld.global.u32 %r6060, [%rd1224]; | |
and.b32 %r6061, %r6060, 65535; | |
shl.b32 %r6062, %r6061, 6; | |
bfe.u32 %r6063, %r6060, 16, 6; | |
or.b32 %r751, %r6062, %r6063; | |
st.local.u32 [%rd2+432], %r751; | |
bfe.u32 %r6064, %r6057, 22, 6; | |
mul.wide.u32 %rd1225, %r6064, 28; | |
add.s64 %rd1226, %rd1222, %rd1225; | |
ld.global.u32 %r6065, [%rd1226]; | |
and.b32 %r6066, %r6065, 65535; | |
shl.b32 %r6067, %r6066, 6; | |
bfe.u32 %r6068, %r6065, 16, 6; | |
or.b32 %r13890, %r6067, %r6068; | |
st.local.u32 [%rd2+436], %r13890; | |
setp.le.u32 %p111, %r751, %r13890; | |
mov.u32 %r13889, %r751; | |
@%p111 bra BB12_218; | |
st.local.v2.u32 [%rd2+432], {%r13890, %r751}; | |
mov.u32 %r12657, %r13890; | |
mov.u32 %r13890, %r751; | |
mov.u32 %r13889, %r12657; | |
BB12_218: | |
mov.u32 %r13885, %r13889; | |
mov.u32 %r13886, %r13890; | |
bfe.u32 %r6069, %r750, 22, 6; | |
mul.lo.s64 %rd1227, %rd71, 1792; | |
add.s64 %rd1228, %rd415, %rd1227; | |
mul.wide.u32 %rd1229, %r6069, 28; | |
add.s64 %rd1230, %rd1228, %rd1229; | |
ld.global.u32 %r6070, [%rd1230]; | |
and.b32 %r6071, %r6070, 65535; | |
bfe.u32 %r6072, %r6070, 16, 6; | |
mul.wide.u32 %rd1231, %r6071, 1792; | |
add.s64 %rd1232, %rd414, %rd1231; | |
mul.wide.u32 %rd1233, %r6072, 28; | |
add.s64 %rd1234, %rd1232, %rd1233; | |
ld.global.u32 %r6073, [%rd1234]; | |
and.b32 %r6074, %r6073, 65535; | |
shl.b32 %r6075, %r6074, 6; | |
bfe.u32 %r6076, %r6073, 16, 6; | |
or.b32 %r755, %r6075, %r6076; | |
st.local.u32 [%rd2+440], %r755; | |
bfe.u32 %r6077, %r6070, 22, 6; | |
mul.wide.u32 %rd1235, %r6077, 28; | |
add.s64 %rd1236, %rd1232, %rd1235; | |
ld.global.u32 %r6078, [%rd1236]; | |
and.b32 %r6079, %r6078, 65535; | |
shl.b32 %r6080, %r6079, 6; | |
bfe.u32 %r6081, %r6078, 16, 6; | |
or.b32 %r13892, %r6080, %r6081; | |
st.local.u32 [%rd2+444], %r13892; | |
setp.le.u32 %p112, %r755, %r13892; | |
mov.u32 %r13891, %r755; | |
@%p112 bra BB12_220; | |
st.local.v2.u32 [%rd2+440], {%r13892, %r755}; | |
mov.u32 %r12663, %r13892; | |
mov.u32 %r13892, %r755; | |
mov.u32 %r13891, %r12663; | |
BB12_220: | |
mov.u32 %r758, %r13891; | |
mov.u32 %r757, %r13892; | |
setp.le.u32 %p113, %r13885, %r758; | |
mov.u32 %r13887, %r758; | |
mov.u32 %r13888, %r757; | |
@%p113 bra BB12_222; | |
st.local.v4.u32 [%rd2+432], {%r758, %r757, %r13885, %r13886}; | |
mov.u32 %r12660, %r13886; | |
mov.u32 %r12662, %r13885; | |
mov.u32 %r13886, %r757; | |
mov.u32 %r13885, %r758; | |
mov.u32 %r13887, %r12662; | |
mov.u32 %r13888, %r12660; | |
BB12_222: | |
mov.u32 %r762, %r13885; | |
mov.u32 %r761, %r13886; | |
mov.u32 %r760, %r13887; | |
mov.u32 %r759, %r13888; | |
setp.le.u32 %p114, %r13869, %r762; | |
mov.u32 %r13873, %r762; | |
mov.u32 %r13874, %r761; | |
mov.u32 %r13875, %r760; | |
mov.u32 %r13876, %r759; | |
@%p114 bra BB12_224; | |
st.local.v4.u32 [%rd2+416], {%r762, %r761, %r760, %r759}; | |
st.local.v4.u32 [%rd2+432], {%r13869, %r13870, %r13871, %r13872}; | |
mov.u32 %r12650, %r13872; | |
mov.u32 %r12652, %r13871; | |
mov.u32 %r12654, %r13870; | |
mov.u32 %r12656, %r13869; | |
mov.u32 %r13872, %r759; | |
mov.u32 %r13871, %r760; | |
mov.u32 %r13870, %r761; | |
mov.u32 %r13869, %r762; | |
mov.u32 %r13873, %r12656; | |
mov.u32 %r13874, %r12654; | |
mov.u32 %r13875, %r12652; | |
mov.u32 %r13876, %r12650; | |
BB12_224: | |
mov.u32 %r770, %r13869; | |
mov.u32 %r769, %r13870; | |
mov.u32 %r768, %r13871; | |
mov.u32 %r767, %r13872; | |
mov.u32 %r766, %r13873; | |
mov.u32 %r765, %r13874; | |
mov.u32 %r764, %r13875; | |
mov.u32 %r763, %r13876; | |
setp.le.u32 %p115, %r13829, %r770; | |
mov.u32 %r13837, %r770; | |
mov.u32 %r13838, %r769; | |
mov.u32 %r13839, %r768; | |
mov.u32 %r13840, %r767; | |
mov.u32 %r13841, %r766; | |
mov.u32 %r13842, %r765; | |
mov.u32 %r13843, %r764; | |
mov.u32 %r13844, %r763; | |
@%p115 bra BB12_226; | |
st.local.v4.u32 [%rd2+384], {%r770, %r769, %r768, %r767}; | |
st.local.v4.u32 [%rd2+416], {%r13829, %r13830, %r13831, %r13832}; | |
st.local.v4.u32 [%rd2+400], {%r766, %r765, %r764, %r763}; | |
st.local.v4.u32 [%rd2+432], {%r13833, %r13834, %r13835, %r13836}; | |
mov.u32 %r12622, %r13836; | |
mov.u32 %r12624, %r13835; | |
mov.u32 %r12626, %r13834; | |
mov.u32 %r12628, %r13833; | |
mov.u32 %r12630, %r13832; | |
mov.u32 %r12632, %r13831; | |
mov.u32 %r12634, %r13830; | |
mov.u32 %r12636, %r13829; | |
mov.u32 %r13836, %r763; | |
mov.u32 %r13835, %r764; | |
mov.u32 %r13834, %r765; | |
mov.u32 %r13833, %r766; | |
mov.u32 %r13832, %r767; | |
mov.u32 %r13831, %r768; | |
mov.u32 %r13830, %r769; | |
mov.u32 %r13829, %r770; | |
mov.u32 %r13837, %r12636; | |
mov.u32 %r13838, %r12634; | |
mov.u32 %r13839, %r12632; | |
mov.u32 %r13840, %r12630; | |
mov.u32 %r13841, %r12628; | |
mov.u32 %r13842, %r12626; | |
mov.u32 %r13843, %r12624; | |
mov.u32 %r13844, %r12622; | |
BB12_226: | |
mov.u32 %r13797, %r13829; | |
mov.u32 %r13798, %r13830; | |
mov.u32 %r13799, %r13831; | |
mov.u32 %r13800, %r13832; | |
mov.u32 %r13801, %r13833; | |
mov.u32 %r13802, %r13834; | |
mov.u32 %r13803, %r13835; | |
mov.u32 %r13804, %r13836; | |
mov.u32 %r13805, %r13837; | |
mov.u32 %r13806, %r13838; | |
mov.u32 %r13807, %r13839; | |
mov.u32 %r13808, %r13840; | |
mov.u32 %r13809, %r13841; | |
mov.u32 %r13810, %r13842; | |
mov.u32 %r13811, %r13843; | |
mov.u32 %r13812, %r13844; | |
mul.lo.s64 %rd1237, %rd64, 1792; | |
add.s64 %rd1238, %rd4, %rd1237; | |
bfe.u32 %r6082, %r699, 22, 6; | |
mul.wide.u32 %rd1239, %r6082, 28; | |
add.s64 %rd1240, %rd1238, %rd1239; | |
ld.global.u32 %r787, [%rd1240+-8]; | |
and.b32 %r6083, %r787, 65535; | |
mul.wide.u32 %rd1241, %r6083, 1792; | |
add.s64 %rd1242, %rd6, %rd1241; | |
bfe.u32 %r6084, %r787, 16, 6; | |
mul.wide.u32 %rd1243, %r6084, 28; | |
add.s64 %rd1244, %rd1242, %rd1243; | |
ld.global.u32 %r788, [%rd1244+-8]; | |
and.b32 %r6085, %r788, 65535; | |
mul.wide.u32 %rd1245, %r6085, 1792; | |
add.s64 %rd1246, %rd4, %rd1245; | |
cvt.u64.u32 %rd72, %r6083; | |
cvt.u64.u32 %rd73, %r6085; | |
bfe.u32 %r6086, %r788, 16, 6; | |
mul.wide.u32 %rd1247, %r6086, 28; | |
add.s64 %rd1248, %rd1246, %rd1247; | |
ld.global.u32 %r789, [%rd1248+-12]; | |
and.b32 %r6087, %r789, 65535; | |
cvt.u64.u32 %rd74, %r6087; | |
bfe.u32 %r6088, %r789, 16, 6; | |
mul.wide.u32 %rd1249, %r6087, 1792; | |
add.s64 %rd1250, %rd415, %rd1249; | |
mul.wide.u32 %rd1251, %r6088, 28; | |
add.s64 %rd1252, %rd1250, %rd1251; | |
ld.global.u32 %r6089, [%rd1252]; | |
and.b32 %r6090, %r6089, 65535; | |
bfe.u32 %r6091, %r6089, 16, 6; | |
mul.wide.u32 %rd1253, %r6090, 1792; | |
add.s64 %rd1254, %rd414, %rd1253; | |
mul.wide.u32 %rd1255, %r6091, 28; | |
add.s64 %rd1256, %rd1254, %rd1255; | |
ld.global.u32 %r6092, [%rd1256]; | |
and.b32 %r6093, %r6092, 65535; | |
shl.b32 %r6094, %r6093, 6; | |
bfe.u32 %r6095, %r6092, 16, 6; | |
or.b32 %r790, %r6094, %r6095; | |
st.local.u32 [%rd2+448], %r790; | |
bfe.u32 %r6096, %r6089, 22, 6; | |
mul.wide.u32 %rd1257, %r6096, 28; | |
add.s64 %rd1258, %rd1254, %rd1257; | |
ld.global.u32 %r6097, [%rd1258]; | |
and.b32 %r6098, %r6097, 65535; | |
shl.b32 %r6099, %r6098, 6; | |
bfe.u32 %r6100, %r6097, 16, 6; | |
or.b32 %r13922, %r6099, %r6100; | |
st.local.u32 [%rd2+452], %r13922; | |
setp.le.u32 %p116, %r790, %r13922; | |
mov.u32 %r13921, %r790; | |
@%p116 bra BB12_228; | |
st.local.v2.u32 [%rd2+448], {%r13922, %r790}; | |
mov.u32 %r12725, %r13922; | |
mov.u32 %r13922, %r790; | |
mov.u32 %r13921, %r12725; | |
BB12_228: | |
mov.u32 %r13917, %r13921; | |
mov.u32 %r13918, %r13922; | |
bfe.u32 %r6101, %r789, 22, 6; | |
mul.lo.s64 %rd1259, %rd74, 1792; | |
add.s64 %rd1260, %rd415, %rd1259; | |
mul.wide.u32 %rd1261, %r6101, 28; | |
add.s64 %rd1262, %rd1260, %rd1261; | |
ld.global.u32 %r6102, [%rd1262]; | |
and.b32 %r6103, %r6102, 65535; | |
bfe.u32 %r6104, %r6102, 16, 6; | |
mul.wide.u32 %rd1263, %r6103, 1792; | |
add.s64 %rd1264, %rd414, %rd1263; | |
mul.wide.u32 %rd1265, %r6104, 28; | |
add.s64 %rd1266, %rd1264, %rd1265; | |
ld.global.u32 %r6105, [%rd1266]; | |
and.b32 %r6106, %r6105, 65535; | |
shl.b32 %r6107, %r6106, 6; | |
bfe.u32 %r6108, %r6105, 16, 6; | |
or.b32 %r794, %r6107, %r6108; | |
st.local.u32 [%rd2+456], %r794; | |
bfe.u32 %r6109, %r6102, 22, 6; | |
mul.wide.u32 %rd1267, %r6109, 28; | |
add.s64 %rd1268, %rd1264, %rd1267; | |
ld.global.u32 %r6110, [%rd1268]; | |
and.b32 %r6111, %r6110, 65535; | |
shl.b32 %r6112, %r6111, 6; | |
bfe.u32 %r6113, %r6110, 16, 6; | |
or.b32 %r13924, %r6112, %r6113; | |
st.local.u32 [%rd2+460], %r13924; | |
setp.le.u32 %p117, %r794, %r13924; | |
mov.u32 %r13923, %r794; | |
@%p117 bra BB12_230; | |
st.local.v2.u32 [%rd2+456], {%r13924, %r794}; | |
mov.u32 %r12731, %r13924; | |
mov.u32 %r13924, %r794; | |
mov.u32 %r13923, %r12731; | |
BB12_230: | |
mov.u32 %r797, %r13923; | |
mov.u32 %r796, %r13924; | |
setp.le.u32 %p118, %r13917, %r797; | |
mov.u32 %r13919, %r797; | |
mov.u32 %r13920, %r796; | |
@%p118 bra BB12_232; | |
st.local.v4.u32 [%rd2+448], {%r797, %r796, %r13917, %r13918}; | |
mov.u32 %r12728, %r13918; | |
mov.u32 %r12730, %r13917; | |
mov.u32 %r13918, %r796; | |
mov.u32 %r13917, %r797; | |
mov.u32 %r13919, %r12730; | |
mov.u32 %r13920, %r12728; | |
BB12_232: | |
mov.u32 %r13909, %r13917; | |
mov.u32 %r13910, %r13918; | |
mov.u32 %r13911, %r13919; | |
mov.u32 %r13912, %r13920; | |
mul.lo.s64 %rd1269, %rd73, 1792; | |
add.s64 %rd1270, %rd4, %rd1269; | |
bfe.u32 %r6114, %r788, 22, 6; | |
mul.wide.u32 %rd1271, %r6114, 28; | |
add.s64 %rd1272, %rd1270, %rd1271; | |
ld.global.u32 %r802, [%rd1272+-12]; | |
and.b32 %r6115, %r802, 65535; | |
cvt.u64.u32 %rd75, %r6115; | |
bfe.u32 %r6116, %r802, 16, 6; | |
mul.wide.u32 %rd1273, %r6115, 1792; | |
add.s64 %rd1274, %rd415, %rd1273; | |
mul.wide.u32 %rd1275, %r6116, 28; | |
add.s64 %rd1276, %rd1274, %rd1275; | |
ld.global.u32 %r6117, [%rd1276]; | |
and.b32 %r6118, %r6117, 65535; | |
bfe.u32 %r6119, %r6117, 16, 6; | |
mul.wide.u32 %rd1277, %r6118, 1792; | |
add.s64 %rd1278, %rd414, %rd1277; | |
mul.wide.u32 %rd1279, %r6119, 28; | |
add.s64 %rd1280, %rd1278, %rd1279; | |
ld.global.u32 %r6120, [%rd1280]; | |
and.b32 %r6121, %r6120, 65535; | |
shl.b32 %r6122, %r6121, 6; | |
bfe.u32 %r6123, %r6120, 16, 6; | |
or.b32 %r803, %r6122, %r6123; | |
st.local.u32 [%rd2+464], %r803; | |
bfe.u32 %r6124, %r6117, 22, 6; | |
mul.wide.u32 %rd1281, %r6124, 28; | |
add.s64 %rd1282, %rd1278, %rd1281; | |
ld.global.u32 %r6125, [%rd1282]; | |
and.b32 %r6126, %r6125, 65535; | |
shl.b32 %r6127, %r6126, 6; | |
bfe.u32 %r6128, %r6125, 16, 6; | |
or.b32 %r13930, %r6127, %r6128; | |
st.local.u32 [%rd2+468], %r13930; | |
setp.le.u32 %p119, %r803, %r13930; | |
mov.u32 %r13929, %r803; | |
@%p119 bra BB12_234; | |
st.local.v2.u32 [%rd2+464], {%r13930, %r803}; | |
mov.u32 %r12745, %r13930; | |
mov.u32 %r13930, %r803; | |
mov.u32 %r13929, %r12745; | |
BB12_234: | |
mov.u32 %r13925, %r13929; | |
mov.u32 %r13926, %r13930; | |
bfe.u32 %r6129, %r802, 22, 6; | |
mul.lo.s64 %rd1283, %rd75, 1792; | |
add.s64 %rd1284, %rd415, %rd1283; | |
mul.wide.u32 %rd1285, %r6129, 28; | |
add.s64 %rd1286, %rd1284, %rd1285; | |
ld.global.u32 %r6130, [%rd1286]; | |
and.b32 %r6131, %r6130, 65535; | |
bfe.u32 %r6132, %r6130, 16, 6; | |
mul.wide.u32 %rd1287, %r6131, 1792; | |
add.s64 %rd1288, %rd414, %rd1287; | |
mul.wide.u32 %rd1289, %r6132, 28; | |
add.s64 %rd1290, %rd1288, %rd1289; | |
ld.global.u32 %r6133, [%rd1290]; | |
and.b32 %r6134, %r6133, 65535; | |
shl.b32 %r6135, %r6134, 6; | |
bfe.u32 %r6136, %r6133, 16, 6; | |
or.b32 %r807, %r6135, %r6136; | |
st.local.u32 [%rd2+472], %r807; | |
bfe.u32 %r6137, %r6130, 22, 6; | |
mul.wide.u32 %rd1291, %r6137, 28; | |
add.s64 %rd1292, %rd1288, %rd1291; | |
ld.global.u32 %r6138, [%rd1292]; | |
and.b32 %r6139, %r6138, 65535; | |
shl.b32 %r6140, %r6139, 6; | |
bfe.u32 %r6141, %r6138, 16, 6; | |
or.b32 %r13932, %r6140, %r6141; | |
st.local.u32 [%rd2+476], %r13932; | |
setp.le.u32 %p120, %r807, %r13932; | |
mov.u32 %r13931, %r807; | |
@%p120 bra BB12_236; | |
st.local.v2.u32 [%rd2+472], {%r13932, %r807}; | |
mov.u32 %r12751, %r13932; | |
mov.u32 %r13932, %r807; | |
mov.u32 %r13931, %r12751; | |
BB12_236: | |
mov.u32 %r810, %r13931; | |
mov.u32 %r809, %r13932; | |
setp.le.u32 %p121, %r13925, %r810; | |
mov.u32 %r13927, %r810; | |
mov.u32 %r13928, %r809; | |
@%p121 bra BB12_238; | |
st.local.v4.u32 [%rd2+464], {%r810, %r809, %r13925, %r13926}; | |
mov.u32 %r12748, %r13926; | |
mov.u32 %r12750, %r13925; | |
mov.u32 %r13926, %r809; | |
mov.u32 %r13925, %r810; | |
mov.u32 %r13927, %r12750; | |
mov.u32 %r13928, %r12748; | |
BB12_238: | |
mov.u32 %r814, %r13925; | |
mov.u32 %r813, %r13926; | |
mov.u32 %r812, %r13927; | |
mov.u32 %r811, %r13928; | |
setp.le.u32 %p122, %r13909, %r814; | |
mov.u32 %r13913, %r814; | |
mov.u32 %r13914, %r813; | |
mov.u32 %r13915, %r812; | |
mov.u32 %r13916, %r811; | |
@%p122 bra BB12_240; | |
st.local.v4.u32 [%rd2+448], {%r814, %r813, %r812, %r811}; | |
st.local.v4.u32 [%rd2+464], {%r13909, %r13910, %r13911, %r13912}; | |
mov.u32 %r12738, %r13912; | |
mov.u32 %r12740, %r13911; | |
mov.u32 %r12742, %r13910; | |
mov.u32 %r12744, %r13909; | |
mov.u32 %r13912, %r811; | |
mov.u32 %r13911, %r812; | |
mov.u32 %r13910, %r813; | |
mov.u32 %r13909, %r814; | |
mov.u32 %r13913, %r12744; | |
mov.u32 %r13914, %r12742; | |
mov.u32 %r13915, %r12740; | |
mov.u32 %r13916, %r12738; | |
BB12_240: | |
mov.u32 %r13893, %r13909; | |
mov.u32 %r13894, %r13910; | |
mov.u32 %r13895, %r13911; | |
mov.u32 %r13896, %r13912; | |
mov.u32 %r13897, %r13913; | |
mov.u32 %r13898, %r13914; | |
mov.u32 %r13899, %r13915; | |
mov.u32 %r13900, %r13916; | |
mul.lo.s64 %rd1293, %rd72, 1792; | |
add.s64 %rd1294, %rd6, %rd1293; | |
bfe.u32 %r6142, %r787, 22, 6; | |
mul.wide.u32 %rd1295, %r6142, 28; | |
add.s64 %rd1296, %rd1294, %rd1295; | |
ld.global.u32 %r823, [%rd1296+-8]; | |
and.b32 %r6143, %r823, 65535; | |
mul.wide.u32 %rd1297, %r6143, 1792; | |
add.s64 %rd1298, %rd4, %rd1297; | |
cvt.u64.u32 %rd76, %r6143; | |
bfe.u32 %r6144, %r823, 16, 6; | |
mul.wide.u32 %rd1299, %r6144, 28; | |
add.s64 %rd1300, %rd1298, %rd1299; | |
ld.global.u32 %r824, [%rd1300+-12]; | |
and.b32 %r6145, %r824, 65535; | |
cvt.u64.u32 %rd77, %r6145; | |
bfe.u32 %r6146, %r824, 16, 6; | |
mul.wide.u32 %rd1301, %r6145, 1792; | |
add.s64 %rd1302, %rd415, %rd1301; | |
mul.wide.u32 %rd1303, %r6146, 28; | |
add.s64 %rd1304, %rd1302, %rd1303; | |
ld.global.u32 %r6147, [%rd1304]; | |
and.b32 %r6148, %r6147, 65535; | |
bfe.u32 %r6149, %r6147, 16, 6; | |
mul.wide.u32 %rd1305, %r6148, 1792; | |
add.s64 %rd1306, %rd414, %rd1305; | |
mul.wide.u32 %rd1307, %r6149, 28; | |
add.s64 %rd1308, %rd1306, %rd1307; | |
ld.global.u32 %r6150, [%rd1308]; | |
and.b32 %r6151, %r6150, 65535; | |
shl.b32 %r6152, %r6151, 6; | |
bfe.u32 %r6153, %r6150, 16, 6; | |
or.b32 %r825, %r6152, %r6153; | |
st.local.u32 [%rd2+480], %r825; | |
bfe.u32 %r6154, %r6147, 22, 6; | |
mul.wide.u32 %rd1309, %r6154, 28; | |
add.s64 %rd1310, %rd1306, %rd1309; | |
ld.global.u32 %r6155, [%rd1310]; | |
and.b32 %r6156, %r6155, 65535; | |
shl.b32 %r6157, %r6156, 6; | |
bfe.u32 %r6158, %r6155, 16, 6; | |
or.b32 %r13946, %r6157, %r6158; | |
st.local.u32 [%rd2+484], %r13946; | |
setp.le.u32 %p123, %r825, %r13946; | |
mov.u32 %r13945, %r825; | |
@%p123 bra BB12_242; | |
st.local.v2.u32 [%rd2+480], {%r13946, %r825}; | |
mov.u32 %r12781, %r13946; | |
mov.u32 %r13946, %r825; | |
mov.u32 %r13945, %r12781; | |
BB12_242: | |
mov.u32 %r13941, %r13945; | |
mov.u32 %r13942, %r13946; | |
bfe.u32 %r6159, %r824, 22, 6; | |
mul.lo.s64 %rd1311, %rd77, 1792; | |
add.s64 %rd1312, %rd415, %rd1311; | |
mul.wide.u32 %rd1313, %r6159, 28; | |
add.s64 %rd1314, %rd1312, %rd1313; | |
ld.global.u32 %r6160, [%rd1314]; | |
and.b32 %r6161, %r6160, 65535; | |
bfe.u32 %r6162, %r6160, 16, 6; | |
mul.wide.u32 %rd1315, %r6161, 1792; | |
add.s64 %rd1316, %rd414, %rd1315; | |
mul.wide.u32 %rd1317, %r6162, 28; | |
add.s64 %rd1318, %rd1316, %rd1317; | |
ld.global.u32 %r6163, [%rd1318]; | |
and.b32 %r6164, %r6163, 65535; | |
shl.b32 %r6165, %r6164, 6; | |
bfe.u32 %r6166, %r6163, 16, 6; | |
or.b32 %r829, %r6165, %r6166; | |
st.local.u32 [%rd2+488], %r829; | |
bfe.u32 %r6167, %r6160, 22, 6; | |
mul.wide.u32 %rd1319, %r6167, 28; | |
add.s64 %rd1320, %rd1316, %rd1319; | |
ld.global.u32 %r6168, [%rd1320]; | |
and.b32 %r6169, %r6168, 65535; | |
shl.b32 %r6170, %r6169, 6; | |
bfe.u32 %r6171, %r6168, 16, 6; | |
or.b32 %r13948, %r6170, %r6171; | |
st.local.u32 [%rd2+492], %r13948; | |
setp.le.u32 %p124, %r829, %r13948; | |
mov.u32 %r13947, %r829; | |
@%p124 bra BB12_244; | |
st.local.v2.u32 [%rd2+488], {%r13948, %r829}; | |
mov.u32 %r12787, %r13948; | |
mov.u32 %r13948, %r829; | |
mov.u32 %r13947, %r12787; | |
BB12_244: | |
mov.u32 %r832, %r13947; | |
mov.u32 %r831, %r13948; | |
setp.le.u32 %p125, %r13941, %r832; | |
mov.u32 %r13943, %r832; | |
mov.u32 %r13944, %r831; | |
@%p125 bra BB12_246; | |
st.local.v4.u32 [%rd2+480], {%r832, %r831, %r13941, %r13942}; | |
mov.u32 %r12784, %r13942; | |
mov.u32 %r12786, %r13941; | |
mov.u32 %r13942, %r831; | |
mov.u32 %r13941, %r832; | |
mov.u32 %r13943, %r12786; | |
mov.u32 %r13944, %r12784; | |
BB12_246: | |
mov.u32 %r13933, %r13941; | |
mov.u32 %r13934, %r13942; | |
mov.u32 %r13935, %r13943; | |
mov.u32 %r13936, %r13944; | |
mul.lo.s64 %rd1321, %rd76, 1792; | |
add.s64 %rd1322, %rd4, %rd1321; | |
bfe.u32 %r6172, %r823, 22, 6; | |
mul.wide.u32 %rd1323, %r6172, 28; | |
add.s64 %rd1324, %rd1322, %rd1323; | |
ld.global.u32 %r837, [%rd1324+-12]; | |
and.b32 %r6173, %r837, 65535; | |
cvt.u64.u32 %rd78, %r6173; | |
bfe.u32 %r6174, %r837, 16, 6; | |
mul.wide.u32 %rd1325, %r6173, 1792; | |
add.s64 %rd1326, %rd415, %rd1325; | |
mul.wide.u32 %rd1327, %r6174, 28; | |
add.s64 %rd1328, %rd1326, %rd1327; | |
ld.global.u32 %r6175, [%rd1328]; | |
and.b32 %r6176, %r6175, 65535; | |
bfe.u32 %r6177, %r6175, 16, 6; | |
mul.wide.u32 %rd1329, %r6176, 1792; | |
add.s64 %rd1330, %rd414, %rd1329; | |
mul.wide.u32 %rd1331, %r6177, 28; | |
add.s64 %rd1332, %rd1330, %rd1331; | |
ld.global.u32 %r6178, [%rd1332]; | |
and.b32 %r6179, %r6178, 65535; | |
shl.b32 %r6180, %r6179, 6; | |
bfe.u32 %r6181, %r6178, 16, 6; | |
or.b32 %r838, %r6180, %r6181; | |
st.local.u32 [%rd2+496], %r838; | |
bfe.u32 %r6182, %r6175, 22, 6; | |
mul.wide.u32 %rd1333, %r6182, 28; | |
add.s64 %rd1334, %rd1330, %rd1333; | |
ld.global.u32 %r6183, [%rd1334]; | |
and.b32 %r6184, %r6183, 65535; | |
shl.b32 %r6185, %r6184, 6; | |
bfe.u32 %r6186, %r6183, 16, 6; | |
or.b32 %r13954, %r6185, %r6186; | |
st.local.u32 [%rd2+500], %r13954; | |
setp.le.u32 %p126, %r838, %r13954; | |
mov.u32 %r13953, %r838; | |
@%p126 bra BB12_248; | |
st.local.v2.u32 [%rd2+496], {%r13954, %r838}; | |
mov.u32 %r12801, %r13954; | |
mov.u32 %r13954, %r838; | |
mov.u32 %r13953, %r12801; | |
BB12_248: | |
mov.u32 %r13949, %r13953; | |
mov.u32 %r13950, %r13954; | |
bfe.u32 %r6187, %r837, 22, 6; | |
mul.lo.s64 %rd1335, %rd78, 1792; | |
add.s64 %rd1336, %rd415, %rd1335; | |
mul.wide.u32 %rd1337, %r6187, 28; | |
add.s64 %rd1338, %rd1336, %rd1337; | |
ld.global.u32 %r6188, [%rd1338]; | |
and.b32 %r6189, %r6188, 65535; | |
bfe.u32 %r6190, %r6188, 16, 6; | |
mul.wide.u32 %rd1339, %r6189, 1792; | |
add.s64 %rd1340, %rd414, %rd1339; | |
mul.wide.u32 %rd1341, %r6190, 28; | |
add.s64 %rd1342, %rd1340, %rd1341; | |
ld.global.u32 %r6191, [%rd1342]; | |
and.b32 %r6192, %r6191, 65535; | |
shl.b32 %r6193, %r6192, 6; | |
bfe.u32 %r6194, %r6191, 16, 6; | |
or.b32 %r842, %r6193, %r6194; | |
st.local.u32 [%rd2+504], %r842; | |
bfe.u32 %r6195, %r6188, 22, 6; | |
mul.wide.u32 %rd1343, %r6195, 28; | |
add.s64 %rd1344, %rd1340, %rd1343; | |
ld.global.u32 %r6196, [%rd1344]; | |
and.b32 %r6197, %r6196, 65535; | |
shl.b32 %r6198, %r6197, 6; | |
bfe.u32 %r6199, %r6196, 16, 6; | |
or.b32 %r13956, %r6198, %r6199; | |
st.local.u32 [%rd2+508], %r13956; | |
setp.le.u32 %p127, %r842, %r13956; | |
mov.u32 %r13955, %r842; | |
@%p127 bra BB12_250; | |
st.local.v2.u32 [%rd2+504], {%r13956, %r842}; | |
mov.u32 %r12807, %r13956; | |
mov.u32 %r13956, %r842; | |
mov.u32 %r13955, %r12807; | |
BB12_250: | |
mov.u32 %r845, %r13955; | |
mov.u32 %r844, %r13956; | |
setp.le.u32 %p128, %r13949, %r845; | |
mov.u32 %r13951, %r845; | |
mov.u32 %r13952, %r844; | |
@%p128 bra BB12_252; | |
st.local.v4.u32 [%rd2+496], {%r845, %r844, %r13949, %r13950}; | |
mov.u32 %r12804, %r13950; | |
mov.u32 %r12806, %r13949; | |
mov.u32 %r13950, %r844; | |
mov.u32 %r13949, %r845; | |
mov.u32 %r13951, %r12806; | |
mov.u32 %r13952, %r12804; | |
BB12_252: | |
mov.u32 %r849, %r13949; | |
mov.u32 %r848, %r13950; | |
mov.u32 %r847, %r13951; | |
mov.u32 %r846, %r13952; | |
setp.le.u32 %p129, %r13933, %r849; | |
mov.u32 %r13937, %r849; | |
mov.u32 %r13938, %r848; | |
mov.u32 %r13939, %r847; | |
mov.u32 %r13940, %r846; | |
@%p129 bra BB12_254; | |
st.local.v4.u32 [%rd2+480], {%r849, %r848, %r847, %r846}; | |
st.local.v4.u32 [%rd2+496], {%r13933, %r13934, %r13935, %r13936}; | |
mov.u32 %r12794, %r13936; | |
mov.u32 %r12796, %r13935; | |
mov.u32 %r12798, %r13934; | |
mov.u32 %r12800, %r13933; | |
mov.u32 %r13936, %r846; | |
mov.u32 %r13935, %r847; | |
mov.u32 %r13934, %r848; | |
mov.u32 %r13933, %r849; | |
mov.u32 %r13937, %r12800; | |
mov.u32 %r13938, %r12798; | |
mov.u32 %r13939, %r12796; | |
mov.u32 %r13940, %r12794; | |
BB12_254: | |
mov.u32 %r857, %r13933; | |
mov.u32 %r856, %r13934; | |
mov.u32 %r855, %r13935; | |
mov.u32 %r854, %r13936; | |
mov.u32 %r853, %r13937; | |
mov.u32 %r852, %r13938; | |
mov.u32 %r851, %r13939; | |
mov.u32 %r850, %r13940; | |
setp.le.u32 %p130, %r13893, %r857; | |
mov.u32 %r13901, %r857; | |
mov.u32 %r13902, %r856; | |
mov.u32 %r13903, %r855; | |
mov.u32 %r13904, %r854; | |
mov.u32 %r13905, %r853; | |
mov.u32 %r13906, %r852; | |
mov.u32 %r13907, %r851; | |
mov.u32 %r13908, %r850; | |
@%p130 bra BB12_256; | |
st.local.v4.u32 [%rd2+448], {%r857, %r856, %r855, %r854}; | |
st.local.v4.u32 [%rd2+480], {%r13893, %r13894, %r13895, %r13896}; | |
st.local.v4.u32 [%rd2+464], {%r853, %r852, %r851, %r850}; | |
st.local.v4.u32 [%rd2+496], {%r13897, %r13898, %r13899, %r13900}; | |
mov.u32 %r12766, %r13900; | |
mov.u32 %r12768, %r13899; | |
mov.u32 %r12770, %r13898; | |
mov.u32 %r12772, %r13897; | |
mov.u32 %r12774, %r13896; | |
mov.u32 %r12776, %r13895; | |
mov.u32 %r12778, %r13894; | |
mov.u32 %r12780, %r13893; | |
mov.u32 %r13900, %r850; | |
mov.u32 %r13899, %r851; | |
mov.u32 %r13898, %r852; | |
mov.u32 %r13897, %r853; | |
mov.u32 %r13896, %r854; | |
mov.u32 %r13895, %r855; | |
mov.u32 %r13894, %r856; | |
mov.u32 %r13893, %r857; | |
mov.u32 %r13901, %r12780; | |
mov.u32 %r13902, %r12778; | |
mov.u32 %r13903, %r12776; | |
mov.u32 %r13904, %r12774; | |
mov.u32 %r13905, %r12772; | |
mov.u32 %r13906, %r12770; | |
mov.u32 %r13907, %r12768; | |
mov.u32 %r13908, %r12766; | |
BB12_256: | |
mov.u32 %r873, %r13893; | |
mov.u32 %r872, %r13894; | |
mov.u32 %r871, %r13895; | |
mov.u32 %r870, %r13896; | |
mov.u32 %r869, %r13897; | |
mov.u32 %r868, %r13898; | |
mov.u32 %r867, %r13899; | |
mov.u32 %r866, %r13900; | |
mov.u32 %r865, %r13901; | |
mov.u32 %r864, %r13902; | |
mov.u32 %r863, %r13903; | |
mov.u32 %r862, %r13904; | |
mov.u32 %r861, %r13905; | |
mov.u32 %r860, %r13906; | |
mov.u32 %r859, %r13907; | |
mov.u32 %r858, %r13908; | |
setp.le.u32 %p131, %r13797, %r873; | |
mov.u32 %r13813, %r873; | |
mov.u32 %r13814, %r872; | |
mov.u32 %r13815, %r871; | |
mov.u32 %r13816, %r870; | |
mov.u32 %r13817, %r869; | |
mov.u32 %r13818, %r868; | |
mov.u32 %r13819, %r867; | |
mov.u32 %r13820, %r866; | |
mov.u32 %r13821, %r865; | |
mov.u32 %r13822, %r864; | |
mov.u32 %r13823, %r863; | |
mov.u32 %r13824, %r862; | |
mov.u32 %r13825, %r861; | |
mov.u32 %r13826, %r860; | |
mov.u32 %r13827, %r859; | |
mov.u32 %r13828, %r858; | |
@%p131 bra BB12_258; | |
st.local.v4.u32 [%rd2+384], {%r873, %r872, %r871, %r870}; | |
st.local.v4.u32 [%rd2+448], {%r13797, %r13798, %r13799, %r13800}; | |
st.local.v4.u32 [%rd2+400], {%r869, %r868, %r867, %r866}; | |
st.local.v4.u32 [%rd2+464], {%r13801, %r13802, %r13803, %r13804}; | |
st.local.v4.u32 [%rd2+416], {%r865, %r864, %r863, %r862}; | |
st.local.v4.u32 [%rd2+480], {%r13805, %r13806, %r13807, %r13808}; | |
st.local.v4.u32 [%rd2+432], {%r861, %r860, %r859, %r858}; | |
st.local.v4.u32 [%rd2+496], {%r13809, %r13810, %r13811, %r13812}; | |
mov.u32 %r12694, %r13812; | |
mov.u32 %r12696, %r13811; | |
mov.u32 %r12698, %r13810; | |
mov.u32 %r12700, %r13809; | |
mov.u32 %r12702, %r13808; | |
mov.u32 %r12704, %r13807; | |
mov.u32 %r12706, %r13806; | |
mov.u32 %r12708, %r13805; | |
mov.u32 %r12710, %r13804; | |
mov.u32 %r12712, %r13803; | |
mov.u32 %r12714, %r13802; | |
mov.u32 %r12716, %r13801; | |
mov.u32 %r12718, %r13800; | |
mov.u32 %r12720, %r13799; | |
mov.u32 %r12722, %r13798; | |
mov.u32 %r12724, %r13797; | |
mov.u32 %r13812, %r858; | |
mov.u32 %r13811, %r859; | |
mov.u32 %r13810, %r860; | |
mov.u32 %r13809, %r861; | |
mov.u32 %r13808, %r862; | |
mov.u32 %r13807, %r863; | |
mov.u32 %r13806, %r864; | |
mov.u32 %r13805, %r865; | |
mov.u32 %r13804, %r866; | |
mov.u32 %r13803, %r867; | |
mov.u32 %r13802, %r868; | |
mov.u32 %r13801, %r869; | |
mov.u32 %r13800, %r870; | |
mov.u32 %r13799, %r871; | |
mov.u32 %r13798, %r872; | |
mov.u32 %r13797, %r873; | |
mov.u32 %r13813, %r12724; | |
mov.u32 %r13814, %r12722; | |
mov.u32 %r13815, %r12720; | |
mov.u32 %r13816, %r12718; | |
mov.u32 %r13817, %r12716; | |
mov.u32 %r13818, %r12714; | |
mov.u32 %r13819, %r12712; | |
mov.u32 %r13820, %r12710; | |
mov.u32 %r13821, %r12708; | |
mov.u32 %r13822, %r12706; | |
mov.u32 %r13823, %r12704; | |
mov.u32 %r13824, %r12702; | |
mov.u32 %r13825, %r12700; | |
mov.u32 %r13826, %r12698; | |
mov.u32 %r13827, %r12696; | |
mov.u32 %r13828, %r12694; | |
BB12_258: | |
mov.u32 %r905, %r13797; | |
mov.u32 %r904, %r13798; | |
mov.u32 %r903, %r13799; | |
mov.u32 %r902, %r13800; | |
mov.u32 %r901, %r13801; | |
mov.u32 %r900, %r13802; | |
mov.u32 %r899, %r13803; | |
mov.u32 %r898, %r13804; | |
mov.u32 %r897, %r13805; | |
mov.u32 %r896, %r13806; | |
mov.u32 %r895, %r13807; | |
mov.u32 %r894, %r13808; | |
mov.u32 %r893, %r13809; | |
mov.u32 %r892, %r13810; | |
mov.u32 %r891, %r13811; | |
mov.u32 %r890, %r13812; | |
mov.u32 %r889, %r13813; | |
mov.u32 %r888, %r13814; | |
mov.u32 %r887, %r13815; | |
mov.u32 %r886, %r13816; | |
mov.u32 %r885, %r13817; | |
mov.u32 %r884, %r13818; | |
mov.u32 %r883, %r13819; | |
mov.u32 %r882, %r13820; | |
mov.u32 %r881, %r13821; | |
mov.u32 %r880, %r13822; | |
mov.u32 %r879, %r13823; | |
mov.u32 %r878, %r13824; | |
mov.u32 %r877, %r13825; | |
mov.u32 %r876, %r13826; | |
mov.u32 %r875, %r13827; | |
mov.u32 %r874, %r13828; | |
setp.le.u32 %p132, %r13573, %r905; | |
mov.u32 %r13605, %r905; | |
mov.u32 %r13606, %r904; | |
mov.u32 %r13607, %r903; | |
mov.u32 %r13608, %r902; | |
mov.u32 %r13609, %r901; | |
mov.u32 %r13610, %r900; | |
mov.u32 %r13611, %r899; | |
mov.u32 %r13612, %r898; | |
mov.u32 %r13613, %r897; | |
mov.u32 %r13614, %r896; | |
mov.u32 %r13615, %r895; | |
mov.u32 %r13616, %r894; | |
mov.u32 %r13617, %r893; | |
mov.u32 %r13618, %r892; | |
mov.u32 %r13619, %r891; | |
mov.u32 %r13620, %r890; | |
mov.u32 %r13621, %r889; | |
mov.u32 %r13622, %r888; | |
mov.u32 %r13623, %r887; | |
mov.u32 %r13624, %r886; | |
mov.u32 %r13625, %r885; | |
mov.u32 %r13626, %r884; | |
mov.u32 %r13627, %r883; | |
mov.u32 %r13628, %r882; | |
mov.u32 %r13629, %r881; | |
mov.u32 %r13630, %r880; | |
mov.u32 %r13631, %r879; | |
mov.u32 %r13632, %r878; | |
mov.u32 %r13633, %r877; | |
mov.u32 %r13634, %r876; | |
mov.u32 %r13635, %r875; | |
mov.u32 %r13636, %r874; | |
@%p132 bra BB12_260; | |
st.local.v4.u32 [%rd2+256], {%r905, %r904, %r903, %r902}; | |
st.local.v4.u32 [%rd2+384], {%r13573, %r13574, %r13575, %r13576}; | |
st.local.v4.u32 [%rd2+272], {%r901, %r900, %r899, %r898}; | |
st.local.v4.u32 [%rd2+400], {%r13577, %r13578, %r13579, %r13580}; | |
st.local.v4.u32 [%rd2+288], {%r897, %r896, %r895, %r894}; | |
st.local.v4.u32 [%rd2+416], {%r13581, %r13582, %r13583, %r13584}; | |
st.local.v4.u32 [%rd2+304], {%r893, %r892, %r891, %r890}; | |
st.local.v4.u32 [%rd2+432], {%r13585, %r13586, %r13587, %r13588}; | |
st.local.v4.u32 [%rd2+320], {%r889, %r888, %r887, %r886}; | |
st.local.v4.u32 [%rd2+448], {%r13589, %r13590, %r13591, %r13592}; | |
st.local.v4.u32 [%rd2+336], {%r885, %r884, %r883, %r882}; | |
st.local.v4.u32 [%rd2+464], {%r13593, %r13594, %r13595, %r13596}; | |
st.local.v4.u32 [%rd2+352], {%r881, %r880, %r879, %r878}; | |
st.local.v4.u32 [%rd2+480], {%r13597, %r13598, %r13599, %r13600}; | |
st.local.v4.u32 [%rd2+368], {%r877, %r876, %r875, %r874}; | |
st.local.v4.u32 [%rd2+496], {%r13601, %r13602, %r13603, %r13604}; | |
mov.u32 %r12518, %r13604; | |
mov.u32 %r12520, %r13603; | |
mov.u32 %r12522, %r13602; | |
mov.u32 %r12524, %r13601; | |
mov.u32 %r12526, %r13600; | |
mov.u32 %r12528, %r13599; | |
mov.u32 %r12530, %r13598; | |
mov.u32 %r12532, %r13597; | |
mov.u32 %r12534, %r13596; | |
mov.u32 %r12536, %r13595; | |
mov.u32 %r12538, %r13594; | |
mov.u32 %r12540, %r13593; | |
mov.u32 %r12542, %r13592; | |
mov.u32 %r12544, %r13591; | |
mov.u32 %r12546, %r13590; | |
mov.u32 %r12548, %r13589; | |
mov.u32 %r12550, %r13588; | |
mov.u32 %r12552, %r13587; | |
mov.u32 %r12554, %r13586; | |
mov.u32 %r12556, %r13585; | |
mov.u32 %r12558, %r13584; | |
mov.u32 %r12560, %r13583; | |
mov.u32 %r12562, %r13582; | |
mov.u32 %r12564, %r13581; | |
mov.u32 %r12566, %r13580; | |
mov.u32 %r12568, %r13579; | |
mov.u32 %r12570, %r13578; | |
mov.u32 %r12572, %r13577; | |
mov.u32 %r12574, %r13576; | |
mov.u32 %r12576, %r13575; | |
mov.u32 %r12578, %r13574; | |
mov.u32 %r12580, %r13573; | |
mov.u32 %r13604, %r874; | |
mov.u32 %r13603, %r875; | |
mov.u32 %r13602, %r876; | |
mov.u32 %r13601, %r877; | |
mov.u32 %r13600, %r878; | |
mov.u32 %r13599, %r879; | |
mov.u32 %r13598, %r880; | |
mov.u32 %r13597, %r881; | |
mov.u32 %r13596, %r882; | |
mov.u32 %r13595, %r883; | |
mov.u32 %r13594, %r884; | |
mov.u32 %r13593, %r885; | |
mov.u32 %r13592, %r886; | |
mov.u32 %r13591, %r887; | |
mov.u32 %r13590, %r888; | |
mov.u32 %r13589, %r889; | |
mov.u32 %r13588, %r890; | |
mov.u32 %r13587, %r891; | |
mov.u32 %r13586, %r892; | |
mov.u32 %r13585, %r893; | |
mov.u32 %r13584, %r894; | |
mov.u32 %r13583, %r895; | |
mov.u32 %r13582, %r896; | |
mov.u32 %r13581, %r897; | |
mov.u32 %r13580, %r898; | |
mov.u32 %r13579, %r899; | |
mov.u32 %r13578, %r900; | |
mov.u32 %r13577, %r901; | |
mov.u32 %r13576, %r902; | |
mov.u32 %r13575, %r903; | |
mov.u32 %r13574, %r904; | |
mov.u32 %r13573, %r905; | |
mov.u32 %r13605, %r12580; | |
mov.u32 %r13606, %r12578; | |
mov.u32 %r13607, %r12576; | |
mov.u32 %r13608, %r12574; | |
mov.u32 %r13609, %r12572; | |
mov.u32 %r13610, %r12570; | |
mov.u32 %r13611, %r12568; | |
mov.u32 %r13612, %r12566; | |
mov.u32 %r13613, %r12564; | |
mov.u32 %r13614, %r12562; | |
mov.u32 %r13615, %r12560; | |
mov.u32 %r13616, %r12558; | |
mov.u32 %r13617, %r12556; | |
mov.u32 %r13618, %r12554; | |
mov.u32 %r13619, %r12552; | |
mov.u32 %r13620, %r12550; | |
mov.u32 %r13621, %r12548; | |
mov.u32 %r13622, %r12546; | |
mov.u32 %r13623, %r12544; | |
mov.u32 %r13624, %r12542; | |
mov.u32 %r13625, %r12540; | |
mov.u32 %r13626, %r12538; | |
mov.u32 %r13627, %r12536; | |
mov.u32 %r13628, %r12534; | |
mov.u32 %r13629, %r12532; | |
mov.u32 %r13630, %r12530; | |
mov.u32 %r13631, %r12528; | |
mov.u32 %r13632, %r12526; | |
mov.u32 %r13633, %r12524; | |
mov.u32 %r13634, %r12522; | |
mov.u32 %r13635, %r12520; | |
mov.u32 %r13636, %r12518; | |
BB12_260: | |
mov.u32 %r969, %r13573; | |
mov.u32 %r968, %r13574; | |
mov.u32 %r967, %r13575; | |
mov.u32 %r966, %r13576; | |
mov.u32 %r965, %r13577; | |
mov.u32 %r964, %r13578; | |
mov.u32 %r963, %r13579; | |
mov.u32 %r962, %r13580; | |
mov.u32 %r961, %r13581; | |
mov.u32 %r960, %r13582; | |
mov.u32 %r959, %r13583; | |
mov.u32 %r958, %r13584; | |
mov.u32 %r957, %r13585; | |
mov.u32 %r956, %r13586; | |
mov.u32 %r955, %r13587; | |
mov.u32 %r954, %r13588; | |
mov.u32 %r953, %r13589; | |
mov.u32 %r952, %r13590; | |
mov.u32 %r951, %r13591; | |
mov.u32 %r950, %r13592; | |
mov.u32 %r949, %r13593; | |
mov.u32 %r948, %r13594; | |
mov.u32 %r947, %r13595; | |
mov.u32 %r946, %r13596; | |
mov.u32 %r945, %r13597; | |
mov.u32 %r944, %r13598; | |
mov.u32 %r943, %r13599; | |
mov.u32 %r942, %r13600; | |
mov.u32 %r941, %r13601; | |
mov.u32 %r940, %r13602; | |
mov.u32 %r939, %r13603; | |
mov.u32 %r938, %r13604; | |
mov.u32 %r937, %r13605; | |
mov.u32 %r936, %r13606; | |
mov.u32 %r935, %r13607; | |
mov.u32 %r934, %r13608; | |
mov.u32 %r933, %r13609; | |
mov.u32 %r932, %r13610; | |
mov.u32 %r931, %r13611; | |
mov.u32 %r930, %r13612; | |
mov.u32 %r929, %r13613; | |
mov.u32 %r928, %r13614; | |
mov.u32 %r927, %r13615; | |
mov.u32 %r926, %r13616; | |
mov.u32 %r925, %r13617; | |
mov.u32 %r924, %r13618; | |
mov.u32 %r923, %r13619; | |
mov.u32 %r922, %r13620; | |
mov.u32 %r921, %r13621; | |
mov.u32 %r920, %r13622; | |
mov.u32 %r919, %r13623; | |
mov.u32 %r918, %r13624; | |
mov.u32 %r917, %r13625; | |
mov.u32 %r916, %r13626; | |
mov.u32 %r915, %r13627; | |
mov.u32 %r914, %r13628; | |
mov.u32 %r913, %r13629; | |
mov.u32 %r912, %r13630; | |
mov.u32 %r911, %r13631; | |
mov.u32 %r910, %r13632; | |
mov.u32 %r909, %r13633; | |
mov.u32 %r908, %r13634; | |
mov.u32 %r907, %r13635; | |
mov.u32 %r906, %r13636; | |
setp.le.u32 %p133, %r13061, %r969; | |
mov.u32 %r13125, %r969; | |
mov.u32 %r13126, %r968; | |
mov.u32 %r13127, %r967; | |
mov.u32 %r13128, %r966; | |
mov.u32 %r13129, %r965; | |
mov.u32 %r13130, %r964; | |
mov.u32 %r13131, %r963; | |
mov.u32 %r13132, %r962; | |
mov.u32 %r13133, %r961; | |
mov.u32 %r13134, %r960; | |
mov.u32 %r13135, %r959; | |
mov.u32 %r13136, %r958; | |
mov.u32 %r13137, %r957; | |
mov.u32 %r13138, %r956; | |
mov.u32 %r13139, %r955; | |
mov.u32 %r13140, %r954; | |
mov.u32 %r13141, %r953; | |
mov.u32 %r13142, %r952; | |
mov.u32 %r13143, %r951; | |
mov.u32 %r13144, %r950; | |
mov.u32 %r13145, %r949; | |
mov.u32 %r13146, %r948; | |
mov.u32 %r13147, %r947; | |
mov.u32 %r13148, %r946; | |
mov.u32 %r13149, %r945; | |
mov.u32 %r13150, %r944; | |
mov.u32 %r13151, %r943; | |
mov.u32 %r13152, %r942; | |
mov.u32 %r13153, %r941; | |
mov.u32 %r13154, %r940; | |
mov.u32 %r13155, %r939; | |
mov.u32 %r13156, %r938; | |
mov.u32 %r13157, %r937; | |
mov.u32 %r13158, %r936; | |
mov.u32 %r13159, %r935; | |
mov.u32 %r13160, %r934; | |
mov.u32 %r13161, %r933; | |
mov.u32 %r13162, %r932; | |
mov.u32 %r13163, %r931; | |
mov.u32 %r13164, %r930; | |
mov.u32 %r13165, %r929; | |
mov.u32 %r13166, %r928; | |
mov.u32 %r13167, %r927; | |
mov.u32 %r13168, %r926; | |
mov.u32 %r13169, %r925; | |
mov.u32 %r13170, %r924; | |
mov.u32 %r13171, %r923; | |
mov.u32 %r13172, %r922; | |
mov.u32 %r13173, %r921; | |
mov.u32 %r13174, %r920; | |
mov.u32 %r13175, %r919; | |
mov.u32 %r13176, %r918; | |
mov.u32 %r13177, %r917; | |
mov.u32 %r13178, %r916; | |
mov.u32 %r13179, %r915; | |
mov.u32 %r13180, %r914; | |
mov.u32 %r13181, %r913; | |
mov.u32 %r13182, %r912; | |
mov.u32 %r13183, %r911; | |
mov.u32 %r13184, %r910; | |
mov.u32 %r13185, %r909; | |
mov.u32 %r13186, %r908; | |
mov.u32 %r13187, %r907; | |
mov.u32 %r13188, %r906; | |
@%p133 bra BB12_262; | |
st.local.v4.u32 [%rd2], {%r969, %r968, %r967, %r966}; | |
st.local.v4.u32 [%rd2+256], {%r13061, %r13062, %r13063, %r13064}; | |
st.local.v4.u32 [%rd2+16], {%r965, %r964, %r963, %r962}; | |
st.local.v4.u32 [%rd2+272], {%r13065, %r13066, %r13067, %r13068}; | |
st.local.v4.u32 [%rd2+32], {%r961, %r960, %r959, %r958}; | |
st.local.v4.u32 [%rd2+288], {%r13069, %r13070, %r13071, %r13072}; | |
st.local.v4.u32 [%rd2+48], {%r957, %r956, %r955, %r954}; | |
st.local.v4.u32 [%rd2+304], {%r13073, %r13074, %r13075, %r13076}; | |
st.local.v4.u32 [%rd2+64], {%r953, %r952, %r951, %r950}; | |
st.local.v4.u32 [%rd2+320], {%r13077, %r13078, %r13079, %r13080}; | |
st.local.v4.u32 [%rd2+80], {%r949, %r948, %r947, %r946}; | |
st.local.v4.u32 [%rd2+336], {%r13081, %r13082, %r13083, %r13084}; | |
st.local.v4.u32 [%rd2+96], {%r945, %r944, %r943, %r942}; | |
st.local.v4.u32 [%rd2+352], {%r13085, %r13086, %r13087, %r13088}; | |
st.local.v4.u32 [%rd2+112], {%r941, %r940, %r939, %r938}; | |
st.local.v4.u32 [%rd2+368], {%r13089, %r13090, %r13091, %r13092}; | |
st.local.v4.u32 [%rd2+128], {%r937, %r936, %r935, %r934}; | |
st.local.v4.u32 [%rd2+384], {%r13093, %r13094, %r13095, %r13096}; | |
st.local.v2.u32 [%rd2+400], {%r13097, %r13098}; | |
st.local.u32 [%rd2+408], %r13099; | |
st.local.v4.u32 [%rd2+144], {%r933, %r932, %r931, %r930}; | |
st.local.u32 [%rd2+412], %r13100; | |
st.local.u32 [%rd2+160], %r929; | |
st.local.u32 [%rd2+416], %r13101; | |
st.local.u32 [%rd2+164], %r928; | |
st.local.u32 [%rd2+420], %r13102; | |
st.local.u32 [%rd2+168], %r927; | |
st.local.u32 [%rd2+424], %r13103; | |
st.local.u32 [%rd2+172], %r926; | |
st.local.u32 [%rd2+428], %r13104; | |
st.local.u32 [%rd2+176], %r925; | |
st.local.u32 [%rd2+432], %r13105; | |
st.local.u32 [%rd2+180], %r924; | |
st.local.u32 [%rd2+436], %r13106; | |
st.local.u32 [%rd2+184], %r923; | |
st.local.u32 [%rd2+440], %r13107; | |
st.local.u32 [%rd2+188], %r922; | |
st.local.u32 [%rd2+444], %r13108; | |
st.local.u32 [%rd2+192], %r921; | |
st.local.u32 [%rd2+448], %r13109; | |
st.local.u32 [%rd2+196], %r920; | |
st.local.u32 [%rd2+452], %r13110; | |
st.local.u32 [%rd2+200], %r919; | |
st.local.u32 [%rd2+456], %r13111; | |
st.local.u32 [%rd2+204], %r918; | |
st.local.u32 [%rd2+460], %r13112; | |
st.local.u32 [%rd2+208], %r917; | |
st.local.u32 [%rd2+464], %r13113; | |
st.local.u32 [%rd2+212], %r916; | |
st.local.u32 [%rd2+468], %r13114; | |
st.local.u32 [%rd2+216], %r915; | |
st.local.u32 [%rd2+472], %r13115; | |
st.local.u32 [%rd2+220], %r914; | |
st.local.u32 [%rd2+476], %r13116; | |
st.local.u32 [%rd2+224], %r913; | |
st.local.u32 [%rd2+480], %r13117; | |
st.local.u32 [%rd2+228], %r912; | |
st.local.u32 [%rd2+484], %r13118; | |
st.local.u32 [%rd2+232], %r911; | |
st.local.u32 [%rd2+488], %r13119; | |
st.local.u32 [%rd2+236], %r910; | |
st.local.u32 [%rd2+492], %r13120; | |
st.local.u32 [%rd2+240], %r909; | |
st.local.u32 [%rd2+496], %r13121; | |
st.local.u32 [%rd2+244], %r908; | |
st.local.u32 [%rd2+500], %r13122; | |
st.local.u32 [%rd2+248], %r907; | |
st.local.u32 [%rd2+504], %r13123; | |
st.local.u32 [%rd2+252], %r906; | |
st.local.u32 [%rd2+508], %r13124; | |
mov.u32 %r12102, %r13124; | |
mov.u32 %r12104, %r13123; | |
mov.u32 %r12106, %r13122; | |
mov.u32 %r12108, %r13121; | |
mov.u32 %r12110, %r13120; | |
mov.u32 %r12112, %r13119; | |
mov.u32 %r12114, %r13118; | |
mov.u32 %r12116, %r13117; | |
mov.u32 %r12118, %r13116; | |
mov.u32 %r12120, %r13115; | |
mov.u32 %r12122, %r13114; | |
mov.u32 %r12124, %r13113; | |
mov.u32 %r12126, %r13112; | |
mov.u32 %r12128, %r13111; | |
mov.u32 %r12130, %r13110; | |
mov.u32 %r12132, %r13109; | |
mov.u32 %r12134, %r13108; | |
mov.u32 %r12136, %r13107; | |
mov.u32 %r12138, %r13106; | |
mov.u32 %r12140, %r13105; | |
mov.u32 %r12142, %r13104; | |
mov.u32 %r12144, %r13103; | |
mov.u32 %r12146, %r13102; | |
mov.u32 %r12148, %r13101; | |
mov.u32 %r12150, %r13100; | |
mov.u32 %r12152, %r13099; | |
mov.u32 %r12154, %r13098; | |
mov.u32 %r12156, %r13097; | |
mov.u32 %r12158, %r13096; | |
mov.u32 %r12160, %r13095; | |
mov.u32 %r12162, %r13094; | |
mov.u32 %r12164, %r13093; | |
mov.u32 %r12166, %r13092; | |
mov.u32 %r12168, %r13091; | |
mov.u32 %r12170, %r13090; | |
mov.u32 %r12172, %r13089; | |
mov.u32 %r12174, %r13088; | |
mov.u32 %r12176, %r13087; | |
mov.u32 %r12178, %r13086; | |
mov.u32 %r12180, %r13085; | |
mov.u32 %r12182, %r13084; | |
mov.u32 %r12184, %r13083; | |
mov.u32 %r12186, %r13082; | |
mov.u32 %r12188, %r13081; | |
mov.u32 %r12190, %r13080; | |
mov.u32 %r12192, %r13079; | |
mov.u32 %r12194, %r13078; | |
mov.u32 %r12196, %r13077; | |
mov.u32 %r12198, %r13076; | |
mov.u32 %r12200, %r13075; | |
mov.u32 %r12202, %r13074; | |
mov.u32 %r12204, %r13073; | |
mov.u32 %r12206, %r13072; | |
mov.u32 %r12208, %r13071; | |
mov.u32 %r12210, %r13070; | |
mov.u32 %r12212, %r13069; | |
mov.u32 %r12214, %r13068; | |
mov.u32 %r12216, %r13067; | |
mov.u32 %r12218, %r13066; | |
mov.u32 %r12220, %r13065; | |
mov.u32 %r12222, %r13064; | |
mov.u32 %r12224, %r13063; | |
mov.u32 %r12226, %r13062; | |
mov.u32 %r12228, %r13061; | |
mov.u32 %r13124, %r906; | |
mov.u32 %r13123, %r907; | |
mov.u32 %r13122, %r908; | |
mov.u32 %r13121, %r909; | |
mov.u32 %r13120, %r910; | |
mov.u32 %r13119, %r911; | |
mov.u32 %r13118, %r912; | |
mov.u32 %r13117, %r913; | |
mov.u32 %r13116, %r914; | |
mov.u32 %r13115, %r915; | |
mov.u32 %r13114, %r916; | |
mov.u32 %r13113, %r917; | |
mov.u32 %r13112, %r918; | |
mov.u32 %r13111, %r919; | |
mov.u32 %r13110, %r920; | |
mov.u32 %r13109, %r921; | |
mov.u32 %r13108, %r922; | |
mov.u32 %r13107, %r923; | |
mov.u32 %r13106, %r924; | |
mov.u32 %r13105, %r925; | |
mov.u32 %r13104, %r926; | |
mov.u32 %r13103, %r927; | |
mov.u32 %r13102, %r928; | |
mov.u32 %r13101, %r929; | |
mov.u32 %r13100, %r930; | |
mov.u32 %r13099, %r931; | |
mov.u32 %r13098, %r932; | |
mov.u32 %r13097, %r933; | |
mov.u32 %r13096, %r934; | |
mov.u32 %r13095, %r935; | |
mov.u32 %r13094, %r936; | |
mov.u32 %r13093, %r937; | |
mov.u32 %r13092, %r938; | |
mov.u32 %r13091, %r939; | |
mov.u32 %r13090, %r940; | |
mov.u32 %r13089, %r941; | |
mov.u32 %r13088, %r942; | |
mov.u32 %r13087, %r943; | |
mov.u32 %r13086, %r944; | |
mov.u32 %r13085, %r945; | |
mov.u32 %r13084, %r946; | |
mov.u32 %r13083, %r947; | |
mov.u32 %r13082, %r948; | |
mov.u32 %r13081, %r949; | |
mov.u32 %r13080, %r950; | |
mov.u32 %r13079, %r951; | |
mov.u32 %r13078, %r952; | |
mov.u32 %r13077, %r953; | |
mov.u32 %r13076, %r954; | |
mov.u32 %r13075, %r955; | |
mov.u32 %r13074, %r956; | |
mov.u32 %r13073, %r957; | |
mov.u32 %r13072, %r958; | |
mov.u32 %r13071, %r959; | |
mov.u32 %r13070, %r960; | |
mov.u32 %r13069, %r961; | |
mov.u32 %r13068, %r962; | |
mov.u32 %r13067, %r963; | |
mov.u32 %r13066, %r964; | |
mov.u32 %r13065, %r965; | |
mov.u32 %r13064, %r966; | |
mov.u32 %r13063, %r967; | |
mov.u32 %r13062, %r968; | |
mov.u32 %r13061, %r969; | |
mov.u32 %r13125, %r12228; | |
mov.u32 %r13126, %r12226; | |
mov.u32 %r13127, %r12224; | |
mov.u32 %r13128, %r12222; | |
mov.u32 %r13129, %r12220; | |
mov.u32 %r13130, %r12218; | |
mov.u32 %r13131, %r12216; | |
mov.u32 %r13132, %r12214; | |
mov.u32 %r13133, %r12212; | |
mov.u32 %r13134, %r12210; | |
mov.u32 %r13135, %r12208; | |
mov.u32 %r13136, %r12206; | |
mov.u32 %r13137, %r12204; | |
mov.u32 %r13138, %r12202; | |
mov.u32 %r13139, %r12200; | |
mov.u32 %r13140, %r12198; | |
mov.u32 %r13141, %r12196; | |
mov.u32 %r13142, %r12194; | |
mov.u32 %r13143, %r12192; | |
mov.u32 %r13144, %r12190; | |
mov.u32 %r13145, %r12188; | |
mov.u32 %r13146, %r12186; | |
mov.u32 %r13147, %r12184; | |
mov.u32 %r13148, %r12182; | |
mov.u32 %r13149, %r12180; | |
mov.u32 %r13150, %r12178; | |
mov.u32 %r13151, %r12176; | |
mov.u32 %r13152, %r12174; | |
mov.u32 %r13153, %r12172; | |
mov.u32 %r13154, %r12170; | |
mov.u32 %r13155, %r12168; | |
mov.u32 %r13156, %r12166; | |
mov.u32 %r13157, %r12164; | |
mov.u32 %r13158, %r12162; | |
mov.u32 %r13159, %r12160; | |
mov.u32 %r13160, %r12158; | |
mov.u32 %r13161, %r12156; | |
mov.u32 %r13162, %r12154; | |
mov.u32 %r13163, %r12152; | |
mov.u32 %r13164, %r12150; | |
mov.u32 %r13165, %r12148; | |
mov.u32 %r13166, %r12146; | |
mov.u32 %r13167, %r12144; | |
mov.u32 %r13168, %r12142; | |
mov.u32 %r13169, %r12140; | |
mov.u32 %r13170, %r12138; | |
mov.u32 %r13171, %r12136; | |
mov.u32 %r13172, %r12134; | |
mov.u32 %r13173, %r12132; | |
mov.u32 %r13174, %r12130; | |
mov.u32 %r13175, %r12128; | |
mov.u32 %r13176, %r12126; | |
mov.u32 %r13177, %r12124; | |
mov.u32 %r13178, %r12122; | |
mov.u32 %r13179, %r12120; | |
mov.u32 %r13180, %r12118; | |
mov.u32 %r13181, %r12116; | |
mov.u32 %r13182, %r12114; | |
mov.u32 %r13183, %r12112; | |
mov.u32 %r13184, %r12110; | |
mov.u32 %r13185, %r12108; | |
mov.u32 %r13186, %r12106; | |
mov.u32 %r13187, %r12104; | |
mov.u32 %r13188, %r12102; | |
BB12_262: | |
bfe.u32 %r6200, %r10, 22, 6; | |
mul.lo.s64 %rd1345, %rd14, 1792; | |
add.s64 %rd1346, %rd6, %rd1345; | |
mul.wide.u32 %rd1347, %r6200, 28; | |
add.s64 %rd1348, %rd1346, %rd1347; | |
ld.global.u32 %r1098, [%rd1348]; | |
and.b32 %r6201, %r1098, 65535; | |
mul.wide.u32 %rd1349, %r6201, 1792; | |
add.s64 %rd1350, %rd4, %rd1349; | |
bfe.u32 %r6202, %r1098, 16, 6; | |
mul.wide.u32 %rd1351, %r6202, 28; | |
add.s64 %rd1352, %rd1350, %rd1351; | |
ld.global.u32 %r1099, [%rd1352+-4]; | |
and.b32 %r6203, %r1099, 65535; | |
mul.wide.u32 %rd1353, %r6203, 1792; | |
add.s64 %rd1354, %rd6, %rd1353; | |
bfe.u32 %r6204, %r1099, 16, 6; | |
mul.wide.u32 %rd1355, %r6204, 28; | |
add.s64 %rd1356, %rd1354, %rd1355; | |
ld.global.u32 %r1100, [%rd1356+-4]; | |
and.b32 %r6205, %r1100, 65535; | |
mul.wide.u32 %rd1357, %r6205, 1792; | |
add.s64 %rd1358, %rd4, %rd1357; | |
bfe.u32 %r6206, %r1100, 16, 6; | |
mul.wide.u32 %rd1359, %r6206, 28; | |
add.s64 %rd1360, %rd1358, %rd1359; | |
ld.global.u32 %r1101, [%rd1360+-8]; | |
and.b32 %r6207, %r1101, 65535; | |
mul.wide.u32 %rd1361, %r6207, 1792; | |
add.s64 %rd1362, %rd6, %rd1361; | |
bfe.u32 %r6208, %r1101, 16, 6; | |
mul.wide.u32 %rd1363, %r6208, 28; | |
add.s64 %rd1364, %rd1362, %rd1363; | |
ld.global.u32 %r1102, [%rd1364+-8]; | |
and.b32 %r6209, %r1102, 65535; | |
mul.wide.u32 %rd1365, %r6209, 1792; | |
add.s64 %rd1366, %rd4, %rd1365; | |
cvt.u64.u32 %rd79, %r6201; | |
cvt.u64.u32 %rd80, %r6203; | |
cvt.u64.u32 %rd81, %r6205; | |
cvt.u64.u32 %rd82, %r6207; | |
cvt.u64.u32 %rd83, %r6209; | |
bfe.u32 %r6210, %r1102, 16, 6; | |
mul.wide.u32 %rd1367, %r6210, 28; | |
add.s64 %rd1368, %rd1366, %rd1367; | |
ld.global.u32 %r1103, [%rd1368+-12]; | |
and.b32 %r6211, %r1103, 65535; | |
cvt.u64.u32 %rd84, %r6211; | |
bfe.u32 %r6212, %r1103, 16, 6; | |
mul.wide.u32 %rd1369, %r6211, 1792; | |
add.s64 %rd1370, %rd415, %rd1369; | |
mul.wide.u32 %rd1371, %r6212, 28; | |
add.s64 %rd1372, %rd1370, %rd1371; | |
ld.global.u32 %r6213, [%rd1372]; | |
and.b32 %r6214, %r6213, 65535; | |
bfe.u32 %r6215, %r6213, 16, 6; | |
mul.wide.u32 %rd1373, %r6214, 1792; | |
add.s64 %rd1374, %rd414, %rd1373; | |
mul.wide.u32 %rd1375, %r6215, 28; | |
add.s64 %rd1376, %rd1374, %rd1375; | |
ld.global.u32 %r6216, [%rd1376]; | |
and.b32 %r6217, %r6216, 65535; | |
shl.b32 %r6218, %r6217, 6; | |
bfe.u32 %r6219, %r6216, 16, 6; | |
or.b32 %r1104, %r6218, %r6219; | |
st.local.u32 [%rd2+512], %r1104; | |
bfe.u32 %r6220, %r6213, 22, 6; | |
mul.wide.u32 %rd1377, %r6220, 28; | |
add.s64 %rd1378, %rd1374, %rd1377; | |
ld.global.u32 %r6221, [%rd1378]; | |
and.b32 %r6222, %r6221, 65535; | |
shl.b32 %r6223, %r6222, 6; | |
bfe.u32 %r6224, %r6221, 16, 6; | |
or.b32 %r15874, %r6223, %r6224; | |
st.local.u32 [%rd2+516], %r15874; | |
setp.le.u32 %p134, %r1104, %r15874; | |
mov.u32 %r15873, %r1104; | |
@%p134 bra BB12_264; | |
st.local.v2.u32 [%rd2+512], {%r15874, %r1104}; | |
mov.u32 %r13957, %r15874; | |
mov.u32 %r15874, %r1104; | |
mov.u32 %r15873, %r13957; | |
BB12_264: | |
mov.u32 %r15869, %r15873; | |
mov.u32 %r15870, %r15874; | |
bfe.u32 %r6225, %r1103, 22, 6; | |
mul.lo.s64 %rd1379, %rd84, 1792; | |
add.s64 %rd1380, %rd415, %rd1379; | |
mul.wide.u32 %rd1381, %r6225, 28; | |
add.s64 %rd1382, %rd1380, %rd1381; | |
ld.global.u32 %r6226, [%rd1382]; | |
and.b32 %r6227, %r6226, 65535; | |
bfe.u32 %r6228, %r6226, 16, 6; | |
mul.wide.u32 %rd1383, %r6227, 1792; | |
add.s64 %rd1384, %rd414, %rd1383; | |
mul.wide.u32 %rd1385, %r6228, 28; | |
add.s64 %rd1386, %rd1384, %rd1385; | |
ld.global.u32 %r6229, [%rd1386]; | |
and.b32 %r6230, %r6229, 65535; | |
shl.b32 %r6231, %r6230, 6; | |
bfe.u32 %r6232, %r6229, 16, 6; | |
or.b32 %r1108, %r6231, %r6232; | |
st.local.u32 [%rd2+520], %r1108; | |
bfe.u32 %r6233, %r6226, 22, 6; | |
mul.wide.u32 %rd1387, %r6233, 28; | |
add.s64 %rd1388, %rd1384, %rd1387; | |
ld.global.u32 %r6234, [%rd1388]; | |
and.b32 %r6235, %r6234, 65535; | |
shl.b32 %r6236, %r6235, 6; | |
bfe.u32 %r6237, %r6234, 16, 6; | |
or.b32 %r15876, %r6236, %r6237; | |
st.local.u32 [%rd2+524], %r15876; | |
setp.le.u32 %p135, %r1108, %r15876; | |
mov.u32 %r15875, %r1108; | |
@%p135 bra BB12_266; | |
st.local.v2.u32 [%rd2+520], {%r15876, %r1108}; | |
mov.u32 %r13963, %r15876; | |
mov.u32 %r15876, %r1108; | |
mov.u32 %r15875, %r13963; | |
BB12_266: | |
mov.u32 %r1111, %r15875; | |
mov.u32 %r1110, %r15876; | |
setp.le.u32 %p136, %r15869, %r1111; | |
mov.u32 %r15871, %r1111; | |
mov.u32 %r15872, %r1110; | |
@%p136 bra BB12_268; | |
st.local.v4.u32 [%rd2+512], {%r1111, %r1110, %r15869, %r15870}; | |
mov.u32 %r13960, %r15870; | |
mov.u32 %r13962, %r15869; | |
mov.u32 %r15870, %r1110; | |
mov.u32 %r15869, %r1111; | |
mov.u32 %r15871, %r13962; | |
mov.u32 %r15872, %r13960; | |
BB12_268: | |
mov.u32 %r15861, %r15869; | |
mov.u32 %r15862, %r15870; | |
mov.u32 %r15863, %r15871; | |
mov.u32 %r15864, %r15872; | |
mul.lo.s64 %rd1389, %rd83, 1792; | |
add.s64 %rd1390, %rd4, %rd1389; | |
bfe.u32 %r6238, %r1102, 22, 6; | |
mul.wide.u32 %rd1391, %r6238, 28; | |
add.s64 %rd1392, %rd1390, %rd1391; | |
ld.global.u32 %r1116, [%rd1392+-12]; | |
and.b32 %r6239, %r1116, 65535; | |
cvt.u64.u32 %rd85, %r6239; | |
bfe.u32 %r6240, %r1116, 16, 6; | |
mul.wide.u32 %rd1393, %r6239, 1792; | |
add.s64 %rd1394, %rd415, %rd1393; | |
mul.wide.u32 %rd1395, %r6240, 28; | |
add.s64 %rd1396, %rd1394, %rd1395; | |
ld.global.u32 %r6241, [%rd1396]; | |
and.b32 %r6242, %r6241, 65535; | |
bfe.u32 %r6243, %r6241, 16, 6; | |
mul.wide.u32 %rd1397, %r6242, 1792; | |
add.s64 %rd1398, %rd414, %rd1397; | |
mul.wide.u32 %rd1399, %r6243, 28; | |
add.s64 %rd1400, %rd1398, %rd1399; | |
ld.global.u32 %r6244, [%rd1400]; | |
and.b32 %r6245, %r6244, 65535; | |
shl.b32 %r6246, %r6245, 6; | |
bfe.u32 %r6247, %r6244, 16, 6; | |
or.b32 %r1117, %r6246, %r6247; | |
st.local.u32 [%rd2+528], %r1117; | |
bfe.u32 %r6248, %r6241, 22, 6; | |
mul.wide.u32 %rd1401, %r6248, 28; | |
add.s64 %rd1402, %rd1398, %rd1401; | |
ld.global.u32 %r6249, [%rd1402]; | |
and.b32 %r6250, %r6249, 65535; | |
shl.b32 %r6251, %r6250, 6; | |
bfe.u32 %r6252, %r6249, 16, 6; | |
or.b32 %r15882, %r6251, %r6252; | |
st.local.u32 [%rd2+532], %r15882; | |
setp.le.u32 %p137, %r1117, %r15882; | |
mov.u32 %r15881, %r1117; | |
@%p137 bra BB12_270; | |
st.local.v2.u32 [%rd2+528], {%r15882, %r1117}; | |
mov.u32 %r13977, %r15882; | |
mov.u32 %r15882, %r1117; | |
mov.u32 %r15881, %r13977; | |
BB12_270: | |
mov.u32 %r15877, %r15881; | |
mov.u32 %r15878, %r15882; | |
bfe.u32 %r6253, %r1116, 22, 6; | |
mul.lo.s64 %rd1403, %rd85, 1792; | |
add.s64 %rd1404, %rd415, %rd1403; | |
mul.wide.u32 %rd1405, %r6253, 28; | |
add.s64 %rd1406, %rd1404, %rd1405; | |
ld.global.u32 %r6254, [%rd1406]; | |
and.b32 %r6255, %r6254, 65535; | |
bfe.u32 %r6256, %r6254, 16, 6; | |
mul.wide.u32 %rd1407, %r6255, 1792; | |
add.s64 %rd1408, %rd414, %rd1407; | |
mul.wide.u32 %rd1409, %r6256, 28; | |
add.s64 %rd1410, %rd1408, %rd1409; | |
ld.global.u32 %r6257, [%rd1410]; | |
and.b32 %r6258, %r6257, 65535; | |
shl.b32 %r6259, %r6258, 6; | |
bfe.u32 %r6260, %r6257, 16, 6; | |
or.b32 %r1121, %r6259, %r6260; | |
st.local.u32 [%rd2+536], %r1121; | |
bfe.u32 %r6261, %r6254, 22, 6; | |
mul.wide.u32 %rd1411, %r6261, 28; | |
add.s64 %rd1412, %rd1408, %rd1411; | |
ld.global.u32 %r6262, [%rd1412]; | |
and.b32 %r6263, %r6262, 65535; | |
shl.b32 %r6264, %r6263, 6; | |
bfe.u32 %r6265, %r6262, 16, 6; | |
or.b32 %r15884, %r6264, %r6265; | |
st.local.u32 [%rd2+540], %r15884; | |
setp.le.u32 %p138, %r1121, %r15884; | |
mov.u32 %r15883, %r1121; | |
@%p138 bra BB12_272; | |
st.local.v2.u32 [%rd2+536], {%r15884, %r1121}; | |
mov.u32 %r13983, %r15884; | |
mov.u32 %r15884, %r1121; | |
mov.u32 %r15883, %r13983; | |
BB12_272: | |
mov.u32 %r1124, %r15883; | |
mov.u32 %r1123, %r15884; | |
setp.le.u32 %p139, %r15877, %r1124; | |
mov.u32 %r15879, %r1124; | |
mov.u32 %r15880, %r1123; | |
@%p139 bra BB12_274; | |
st.local.v4.u32 [%rd2+528], {%r1124, %r1123, %r15877, %r15878}; | |
mov.u32 %r13980, %r15878; | |
mov.u32 %r13982, %r15877; | |
mov.u32 %r15878, %r1123; | |
mov.u32 %r15877, %r1124; | |
mov.u32 %r15879, %r13982; | |
mov.u32 %r15880, %r13980; | |
BB12_274: | |
mov.u32 %r1128, %r15877; | |
mov.u32 %r1127, %r15878; | |
mov.u32 %r1126, %r15879; | |
mov.u32 %r1125, %r15880; | |
setp.le.u32 %p140, %r15861, %r1128; | |
mov.u32 %r15865, %r1128; | |
mov.u32 %r15866, %r1127; | |
mov.u32 %r15867, %r1126; | |
mov.u32 %r15868, %r1125; | |
@%p140 bra BB12_276; | |
st.local.v4.u32 [%rd2+512], {%r1128, %r1127, %r1126, %r1125}; | |
st.local.v4.u32 [%rd2+528], {%r15861, %r15862, %r15863, %r15864}; | |
mov.u32 %r13970, %r15864; | |
mov.u32 %r13972, %r15863; | |
mov.u32 %r13974, %r15862; | |
mov.u32 %r13976, %r15861; | |
mov.u32 %r15864, %r1125; | |
mov.u32 %r15863, %r1126; | |
mov.u32 %r15862, %r1127; | |
mov.u32 %r15861, %r1128; | |
mov.u32 %r15865, %r13976; | |
mov.u32 %r15866, %r13974; | |
mov.u32 %r15867, %r13972; | |
mov.u32 %r15868, %r13970; | |
BB12_276: | |
mov.u32 %r15845, %r15861; | |
mov.u32 %r15846, %r15862; | |
mov.u32 %r15847, %r15863; | |
mov.u32 %r15848, %r15864; | |
mov.u32 %r15849, %r15865; | |
mov.u32 %r15850, %r15866; | |
mov.u32 %r15851, %r15867; | |
mov.u32 %r15852, %r15868; | |
mul.lo.s64 %rd1413, %rd82, 1792; | |
add.s64 %rd1414, %rd6, %rd1413; | |
bfe.u32 %r6266, %r1101, 22, 6; | |
mul.wide.u32 %rd1415, %r6266, 28; | |
add.s64 %rd1416, %rd1414, %rd1415; | |
ld.global.u32 %r1137, [%rd1416+-8]; | |
and.b32 %r6267, %r1137, 65535; | |
mul.wide.u32 %rd1417, %r6267, 1792; | |
add.s64 %rd1418, %rd4, %rd1417; | |
cvt.u64.u32 %rd86, %r6267; | |
bfe.u32 %r6268, %r1137, 16, 6; | |
mul.wide.u32 %rd1419, %r6268, 28; | |
add.s64 %rd1420, %rd1418, %rd1419; | |
ld.global.u32 %r1138, [%rd1420+-12]; | |
and.b32 %r6269, %r1138, 65535; | |
cvt.u64.u32 %rd87, %r6269; | |
bfe.u32 %r6270, %r1138, 16, 6; | |
mul.wide.u32 %rd1421, %r6269, 1792; | |
add.s64 %rd1422, %rd415, %rd1421; | |
mul.wide.u32 %rd1423, %r6270, 28; | |
add.s64 %rd1424, %rd1422, %rd1423; | |
ld.global.u32 %r6271, [%rd1424]; | |
and.b32 %r6272, %r6271, 65535; | |
bfe.u32 %r6273, %r6271, 16, 6; | |
mul.wide.u32 %rd1425, %r6272, 1792; | |
add.s64 %rd1426, %rd414, %rd1425; | |
mul.wide.u32 %rd1427, %r6273, 28; | |
add.s64 %rd1428, %rd1426, %rd1427; | |
ld.global.u32 %r6274, [%rd1428]; | |
and.b32 %r6275, %r6274, 65535; | |
shl.b32 %r6276, %r6275, 6; | |
bfe.u32 %r6277, %r6274, 16, 6; | |
or.b32 %r1139, %r6276, %r6277; | |
st.local.u32 [%rd2+544], %r1139; | |
bfe.u32 %r6278, %r6271, 22, 6; | |
mul.wide.u32 %rd1429, %r6278, 28; | |
add.s64 %rd1430, %rd1426, %rd1429; | |
ld.global.u32 %r6279, [%rd1430]; | |
and.b32 %r6280, %r6279, 65535; | |
shl.b32 %r6281, %r6280, 6; | |
bfe.u32 %r6282, %r6279, 16, 6; | |
or.b32 %r15898, %r6281, %r6282; | |
st.local.u32 [%rd2+548], %r15898; | |
setp.le.u32 %p141, %r1139, %r15898; | |
mov.u32 %r15897, %r1139; | |
@%p141 bra BB12_278; | |
st.local.v2.u32 [%rd2+544], {%r15898, %r1139}; | |
mov.u32 %r14013, %r15898; | |
mov.u32 %r15898, %r1139; | |
mov.u32 %r15897, %r14013; | |
BB12_278: | |
mov.u32 %r15893, %r15897; | |
mov.u32 %r15894, %r15898; | |
bfe.u32 %r6283, %r1138, 22, 6; | |
mul.lo.s64 %rd1431, %rd87, 1792; | |
add.s64 %rd1432, %rd415, %rd1431; | |
mul.wide.u32 %rd1433, %r6283, 28; | |
add.s64 %rd1434, %rd1432, %rd1433; | |
ld.global.u32 %r6284, [%rd1434]; | |
and.b32 %r6285, %r6284, 65535; | |
bfe.u32 %r6286, %r6284, 16, 6; | |
mul.wide.u32 %rd1435, %r6285, 1792; | |
add.s64 %rd1436, %rd414, %rd1435; | |
mul.wide.u32 %rd1437, %r6286, 28; | |
add.s64 %rd1438, %rd1436, %rd1437; | |
ld.global.u32 %r6287, [%rd1438]; | |
and.b32 %r6288, %r6287, 65535; | |
shl.b32 %r6289, %r6288, 6; | |
bfe.u32 %r6290, %r6287, 16, 6; | |
or.b32 %r1143, %r6289, %r6290; | |
st.local.u32 [%rd2+552], %r1143; | |
bfe.u32 %r6291, %r6284, 22, 6; | |
mul.wide.u32 %rd1439, %r6291, 28; | |
add.s64 %rd1440, %rd1436, %rd1439; | |
ld.global.u32 %r6292, [%rd1440]; | |
and.b32 %r6293, %r6292, 65535; | |
shl.b32 %r6294, %r6293, 6; | |
bfe.u32 %r6295, %r6292, 16, 6; | |
or.b32 %r15900, %r6294, %r6295; | |
st.local.u32 [%rd2+556], %r15900; | |
setp.le.u32 %p142, %r1143, %r15900; | |
mov.u32 %r15899, %r1143; | |
@%p142 bra BB12_280; | |
st.local.v2.u32 [%rd2+552], {%r15900, %r1143}; | |
mov.u32 %r14019, %r15900; | |
mov.u32 %r15900, %r1143; | |
mov.u32 %r15899, %r14019; | |
BB12_280: | |
mov.u32 %r1146, %r15899; | |
mov.u32 %r1145, %r15900; | |
setp.le.u32 %p143, %r15893, %r1146; | |
mov.u32 %r15895, %r1146; | |
mov.u32 %r15896, %r1145; | |
@%p143 bra BB12_282; | |
st.local.v4.u32 [%rd2+544], {%r1146, %r1145, %r15893, %r15894}; | |
mov.u32 %r14016, %r15894; | |
mov.u32 %r14018, %r15893; | |
mov.u32 %r15894, %r1145; | |
mov.u32 %r15893, %r1146; | |
mov.u32 %r15895, %r14018; | |
mov.u32 %r15896, %r14016; | |
BB12_282: | |
mov.u32 %r15885, %r15893; | |
mov.u32 %r15886, %r15894; | |
mov.u32 %r15887, %r15895; | |
mov.u32 %r15888, %r15896; | |
mul.lo.s64 %rd1441, %rd86, 1792; | |
add.s64 %rd1442, %rd4, %rd1441; | |
bfe.u32 %r6296, %r1137, 22, 6; | |
mul.wide.u32 %rd1443, %r6296, 28; | |
add.s64 %rd1444, %rd1442, %rd1443; | |
ld.global.u32 %r1151, [%rd1444+-12]; | |
and.b32 %r6297, %r1151, 65535; | |
cvt.u64.u32 %rd88, %r6297; | |
bfe.u32 %r6298, %r1151, 16, 6; | |
mul.wide.u32 %rd1445, %r6297, 1792; | |
add.s64 %rd1446, %rd415, %rd1445; | |
mul.wide.u32 %rd1447, %r6298, 28; | |
add.s64 %rd1448, %rd1446, %rd1447; | |
ld.global.u32 %r6299, [%rd1448]; | |
and.b32 %r6300, %r6299, 65535; | |
bfe.u32 %r6301, %r6299, 16, 6; | |
mul.wide.u32 %rd1449, %r6300, 1792; | |
add.s64 %rd1450, %rd414, %rd1449; | |
mul.wide.u32 %rd1451, %r6301, 28; | |
add.s64 %rd1452, %rd1450, %rd1451; | |
ld.global.u32 %r6302, [%rd1452]; | |
and.b32 %r6303, %r6302, 65535; | |
shl.b32 %r6304, %r6303, 6; | |
bfe.u32 %r6305, %r6302, 16, 6; | |
or.b32 %r1152, %r6304, %r6305; | |
st.local.u32 [%rd2+560], %r1152; | |
bfe.u32 %r6306, %r6299, 22, 6; | |
mul.wide.u32 %rd1453, %r6306, 28; | |
add.s64 %rd1454, %rd1450, %rd1453; | |
ld.global.u32 %r6307, [%rd1454]; | |
and.b32 %r6308, %r6307, 65535; | |
shl.b32 %r6309, %r6308, 6; | |
bfe.u32 %r6310, %r6307, 16, 6; | |
or.b32 %r15906, %r6309, %r6310; | |
st.local.u32 [%rd2+564], %r15906; | |
setp.le.u32 %p144, %r1152, %r15906; | |
mov.u32 %r15905, %r1152; | |
@%p144 bra BB12_284; | |
st.local.v2.u32 [%rd2+560], {%r15906, %r1152}; | |
mov.u32 %r14033, %r15906; | |
mov.u32 %r15906, %r1152; | |
mov.u32 %r15905, %r14033; | |
BB12_284: | |
mov.u32 %r15901, %r15905; | |
mov.u32 %r15902, %r15906; | |
bfe.u32 %r6311, %r1151, 22, 6; | |
mul.lo.s64 %rd1455, %rd88, 1792; | |
add.s64 %rd1456, %rd415, %rd1455; | |
mul.wide.u32 %rd1457, %r6311, 28; | |
add.s64 %rd1458, %rd1456, %rd1457; | |
ld.global.u32 %r6312, [%rd1458]; | |
and.b32 %r6313, %r6312, 65535; | |
bfe.u32 %r6314, %r6312, 16, 6; | |
mul.wide.u32 %rd1459, %r6313, 1792; | |
add.s64 %rd1460, %rd414, %rd1459; | |
mul.wide.u32 %rd1461, %r6314, 28; | |
add.s64 %rd1462, %rd1460, %rd1461; | |
ld.global.u32 %r6315, [%rd1462]; | |
and.b32 %r6316, %r6315, 65535; | |
shl.b32 %r6317, %r6316, 6; | |
bfe.u32 %r6318, %r6315, 16, 6; | |
or.b32 %r1156, %r6317, %r6318; | |
st.local.u32 [%rd2+568], %r1156; | |
bfe.u32 %r6319, %r6312, 22, 6; | |
mul.wide.u32 %rd1463, %r6319, 28; | |
add.s64 %rd1464, %rd1460, %rd1463; | |
ld.global.u32 %r6320, [%rd1464]; | |
and.b32 %r6321, %r6320, 65535; | |
shl.b32 %r6322, %r6321, 6; | |
bfe.u32 %r6323, %r6320, 16, 6; | |
or.b32 %r15908, %r6322, %r6323; | |
st.local.u32 [%rd2+572], %r15908; | |
setp.le.u32 %p145, %r1156, %r15908; | |
mov.u32 %r15907, %r1156; | |
@%p145 bra BB12_286; | |
st.local.v2.u32 [%rd2+568], {%r15908, %r1156}; | |
mov.u32 %r14039, %r15908; | |
mov.u32 %r15908, %r1156; | |
mov.u32 %r15907, %r14039; | |
BB12_286: | |
mov.u32 %r1159, %r15907; | |
mov.u32 %r1158, %r15908; | |
setp.le.u32 %p146, %r15901, %r1159; | |
mov.u32 %r15903, %r1159; | |
mov.u32 %r15904, %r1158; | |
@%p146 bra BB12_288; | |
st.local.v4.u32 [%rd2+560], {%r1159, %r1158, %r15901, %r15902}; | |
mov.u32 %r14036, %r15902; | |
mov.u32 %r14038, %r15901; | |
mov.u32 %r15902, %r1158; | |
mov.u32 %r15901, %r1159; | |
mov.u32 %r15903, %r14038; | |
mov.u32 %r15904, %r14036; | |
BB12_288: | |
mov.u32 %r1163, %r15901; | |
mov.u32 %r1162, %r15902; | |
mov.u32 %r1161, %r15903; | |
mov.u32 %r1160, %r15904; | |
setp.le.u32 %p147, %r15885, %r1163; | |
mov.u32 %r15889, %r1163; | |
mov.u32 %r15890, %r1162; | |
mov.u32 %r15891, %r1161; | |
mov.u32 %r15892, %r1160; | |
@%p147 bra BB12_290; | |
st.local.v4.u32 [%rd2+544], {%r1163, %r1162, %r1161, %r1160}; | |
st.local.v4.u32 [%rd2+560], {%r15885, %r15886, %r15887, %r15888}; | |
mov.u32 %r14026, %r15888; | |
mov.u32 %r14028, %r15887; | |
mov.u32 %r14030, %r15886; | |
mov.u32 %r14032, %r15885; | |
mov.u32 %r15888, %r1160; | |
mov.u32 %r15887, %r1161; | |
mov.u32 %r15886, %r1162; | |
mov.u32 %r15885, %r1163; | |
mov.u32 %r15889, %r14032; | |
mov.u32 %r15890, %r14030; | |
mov.u32 %r15891, %r14028; | |
mov.u32 %r15892, %r14026; | |
BB12_290: | |
mov.u32 %r1171, %r15885; | |
mov.u32 %r1170, %r15886; | |
mov.u32 %r1169, %r15887; | |
mov.u32 %r1168, %r15888; | |
mov.u32 %r1167, %r15889; | |
mov.u32 %r1166, %r15890; | |
mov.u32 %r1165, %r15891; | |
mov.u32 %r1164, %r15892; | |
setp.le.u32 %p148, %r15845, %r1171; | |
mov.u32 %r15853, %r1171; | |
mov.u32 %r15854, %r1170; | |
mov.u32 %r15855, %r1169; | |
mov.u32 %r15856, %r1168; | |
mov.u32 %r15857, %r1167; | |
mov.u32 %r15858, %r1166; | |
mov.u32 %r15859, %r1165; | |
mov.u32 %r15860, %r1164; | |
@%p148 bra BB12_292; | |
st.local.v4.u32 [%rd2+512], {%r1171, %r1170, %r1169, %r1168}; | |
st.local.v4.u32 [%rd2+544], {%r15845, %r15846, %r15847, %r15848}; | |
st.local.v4.u32 [%rd2+528], {%r1167, %r1166, %r1165, %r1164}; | |
st.local.v4.u32 [%rd2+560], {%r15849, %r15850, %r15851, %r15852}; | |
mov.u32 %r13998, %r15852; | |
mov.u32 %r14000, %r15851; | |
mov.u32 %r14002, %r15850; | |
mov.u32 %r14004, %r15849; | |
mov.u32 %r14006, %r15848; | |
mov.u32 %r14008, %r15847; | |
mov.u32 %r14010, %r15846; | |
mov.u32 %r14012, %r15845; | |
mov.u32 %r15852, %r1164; | |
mov.u32 %r15851, %r1165; | |
mov.u32 %r15850, %r1166; | |
mov.u32 %r15849, %r1167; | |
mov.u32 %r15848, %r1168; | |
mov.u32 %r15847, %r1169; | |
mov.u32 %r15846, %r1170; | |
mov.u32 %r15845, %r1171; | |
mov.u32 %r15853, %r14012; | |
mov.u32 %r15854, %r14010; | |
mov.u32 %r15855, %r14008; | |
mov.u32 %r15856, %r14006; | |
mov.u32 %r15857, %r14004; | |
mov.u32 %r15858, %r14002; | |
mov.u32 %r15859, %r14000; | |
mov.u32 %r15860, %r13998; | |
BB12_292: | |
mov.u32 %r15813, %r15845; | |
mov.u32 %r15814, %r15846; | |
mov.u32 %r15815, %r15847; | |
mov.u32 %r15816, %r15848; | |
mov.u32 %r15817, %r15849; | |
mov.u32 %r15818, %r15850; | |
mov.u32 %r15819, %r15851; | |
mov.u32 %r15820, %r15852; | |
mov.u32 %r15821, %r15853; | |
mov.u32 %r15822, %r15854; | |
mov.u32 %r15823, %r15855; | |
mov.u32 %r15824, %r15856; | |
mov.u32 %r15825, %r15857; | |
mov.u32 %r15826, %r15858; | |
mov.u32 %r15827, %r15859; | |
mov.u32 %r15828, %r15860; | |
mul.lo.s64 %rd1465, %rd81, 1792; | |
add.s64 %rd1466, %rd4, %rd1465; | |
bfe.u32 %r6324, %r1100, 22, 6; | |
mul.wide.u32 %rd1467, %r6324, 28; | |
add.s64 %rd1468, %rd1466, %rd1467; | |
ld.global.u32 %r1188, [%rd1468+-8]; | |
and.b32 %r6325, %r1188, 65535; | |
mul.wide.u32 %rd1469, %r6325, 1792; | |
add.s64 %rd1470, %rd6, %rd1469; | |
bfe.u32 %r6326, %r1188, 16, 6; | |
mul.wide.u32 %rd1471, %r6326, 28; | |
add.s64 %rd1472, %rd1470, %rd1471; | |
ld.global.u32 %r1189, [%rd1472+-8]; | |
and.b32 %r6327, %r1189, 65535; | |
mul.wide.u32 %rd1473, %r6327, 1792; | |
add.s64 %rd1474, %rd4, %rd1473; | |
cvt.u64.u32 %rd89, %r6325; | |
cvt.u64.u32 %rd90, %r6327; | |
bfe.u32 %r6328, %r1189, 16, 6; | |
mul.wide.u32 %rd1475, %r6328, 28; | |
add.s64 %rd1476, %rd1474, %rd1475; | |
ld.global.u32 %r1190, [%rd1476+-12]; | |
and.b32 %r6329, %r1190, 65535; | |
cvt.u64.u32 %rd91, %r6329; | |
bfe.u32 %r6330, %r1190, 16, 6; | |
mul.wide.u32 %rd1477, %r6329, 1792; | |
add.s64 %rd1478, %rd415, %rd1477; | |
mul.wide.u32 %rd1479, %r6330, 28; | |
add.s64 %rd1480, %rd1478, %rd1479; | |
ld.global.u32 %r6331, [%rd1480]; | |
and.b32 %r6332, %r6331, 65535; | |
bfe.u32 %r6333, %r6331, 16, 6; | |
mul.wide.u32 %rd1481, %r6332, 1792; | |
add.s64 %rd1482, %rd414, %rd1481; | |
mul.wide.u32 %rd1483, %r6333, 28; | |
add.s64 %rd1484, %rd1482, %rd1483; | |
ld.global.u32 %r6334, [%rd1484]; | |
and.b32 %r6335, %r6334, 65535; | |
shl.b32 %r6336, %r6335, 6; | |
bfe.u32 %r6337, %r6334, 16, 6; | |
or.b32 %r1191, %r6336, %r6337; | |
st.local.u32 [%rd2+576], %r1191; | |
bfe.u32 %r6338, %r6331, 22, 6; | |
mul.wide.u32 %rd1485, %r6338, 28; | |
add.s64 %rd1486, %rd1482, %rd1485; | |
ld.global.u32 %r6339, [%rd1486]; | |
and.b32 %r6340, %r6339, 65535; | |
shl.b32 %r6341, %r6340, 6; | |
bfe.u32 %r6342, %r6339, 16, 6; | |
or.b32 %r15938, %r6341, %r6342; | |
st.local.u32 [%rd2+580], %r15938; | |
setp.le.u32 %p149, %r1191, %r15938; | |
mov.u32 %r15937, %r1191; | |
@%p149 bra BB12_294; | |
st.local.v2.u32 [%rd2+576], {%r15938, %r1191}; | |
mov.u32 %r14101, %r15938; | |
mov.u32 %r15938, %r1191; | |
mov.u32 %r15937, %r14101; | |
BB12_294: | |
mov.u32 %r15933, %r15937; | |
mov.u32 %r15934, %r15938; | |
bfe.u32 %r6343, %r1190, 22, 6; | |
mul.lo.s64 %rd1487, %rd91, 1792; | |
add.s64 %rd1488, %rd415, %rd1487; | |
mul.wide.u32 %rd1489, %r6343, 28; | |
add.s64 %rd1490, %rd1488, %rd1489; | |
ld.global.u32 %r6344, [%rd1490]; | |
and.b32 %r6345, %r6344, 65535; | |
bfe.u32 %r6346, %r6344, 16, 6; | |
mul.wide.u32 %rd1491, %r6345, 1792; | |
add.s64 %rd1492, %rd414, %rd1491; | |
mul.wide.u32 %rd1493, %r6346, 28; | |
add.s64 %rd1494, %rd1492, %rd1493; | |
ld.global.u32 %r6347, [%rd1494]; | |
and.b32 %r6348, %r6347, 65535; | |
shl.b32 %r6349, %r6348, 6; | |
bfe.u32 %r6350, %r6347, 16, 6; | |
or.b32 %r1195, %r6349, %r6350; | |
st.local.u32 [%rd2+584], %r1195; | |
bfe.u32 %r6351, %r6344, 22, 6; | |
mul.wide.u32 %rd1495, %r6351, 28; | |
add.s64 %rd1496, %rd1492, %rd1495; | |
ld.global.u32 %r6352, [%rd1496]; | |
and.b32 %r6353, %r6352, 65535; | |
shl.b32 %r6354, %r6353, 6; | |
bfe.u32 %r6355, %r6352, 16, 6; | |
or.b32 %r15940, %r6354, %r6355; | |
st.local.u32 [%rd2+588], %r15940; | |
setp.le.u32 %p150, %r1195, %r15940; | |
mov.u32 %r15939, %r1195; | |
@%p150 bra BB12_296; | |
st.local.v2.u32 [%rd2+584], {%r15940, %r1195}; | |
mov.u32 %r14107, %r15940; | |
mov.u32 %r15940, %r1195; | |
mov.u32 %r15939, %r14107; | |
BB12_296: | |
mov.u32 %r1198, %r15939; | |
mov.u32 %r1197, %r15940; | |
setp.le.u32 %p151, %r15933, %r1198; | |
mov.u32 %r15935, %r1198; | |
mov.u32 %r15936, %r1197; | |
@%p151 bra BB12_298; | |
st.local.v4.u32 [%rd2+576], {%r1198, %r1197, %r15933, %r15934}; | |
mov.u32 %r14104, %r15934; | |
mov.u32 %r14106, %r15933; | |
mov.u32 %r15934, %r1197; | |
mov.u32 %r15933, %r1198; | |
mov.u32 %r15935, %r14106; | |
mov.u32 %r15936, %r14104; | |
BB12_298: | |
mov.u32 %r15925, %r15933; | |
mov.u32 %r15926, %r15934; | |
mov.u32 %r15927, %r15935; | |
mov.u32 %r15928, %r15936; | |
mul.lo.s64 %rd1497, %rd90, 1792; | |
add.s64 %rd1498, %rd4, %rd1497; | |
bfe.u32 %r6356, %r1189, 22, 6; | |
mul.wide.u32 %rd1499, %r6356, 28; | |
add.s64 %rd1500, %rd1498, %rd1499; | |
ld.global.u32 %r1203, [%rd1500+-12]; | |
and.b32 %r6357, %r1203, 65535; | |
cvt.u64.u32 %rd92, %r6357; | |
bfe.u32 %r6358, %r1203, 16, 6; | |
mul.wide.u32 %rd1501, %r6357, 1792; | |
add.s64 %rd1502, %rd415, %rd1501; | |
mul.wide.u32 %rd1503, %r6358, 28; | |
add.s64 %rd1504, %rd1502, %rd1503; | |
ld.global.u32 %r6359, [%rd1504]; | |
and.b32 %r6360, %r6359, 65535; | |
bfe.u32 %r6361, %r6359, 16, 6; | |
mul.wide.u32 %rd1505, %r6360, 1792; | |
add.s64 %rd1506, %rd414, %rd1505; | |
mul.wide.u32 %rd1507, %r6361, 28; | |
add.s64 %rd1508, %rd1506, %rd1507; | |
ld.global.u32 %r6362, [%rd1508]; | |
and.b32 %r6363, %r6362, 65535; | |
shl.b32 %r6364, %r6363, 6; | |
bfe.u32 %r6365, %r6362, 16, 6; | |
or.b32 %r1204, %r6364, %r6365; | |
st.local.u32 [%rd2+592], %r1204; | |
bfe.u32 %r6366, %r6359, 22, 6; | |
mul.wide.u32 %rd1509, %r6366, 28; | |
add.s64 %rd1510, %rd1506, %rd1509; | |
ld.global.u32 %r6367, [%rd1510]; | |
and.b32 %r6368, %r6367, 65535; | |
shl.b32 %r6369, %r6368, 6; | |
bfe.u32 %r6370, %r6367, 16, 6; | |
or.b32 %r15946, %r6369, %r6370; | |
st.local.u32 [%rd2+596], %r15946; | |
setp.le.u32 %p152, %r1204, %r15946; | |
mov.u32 %r15945, %r1204; | |
@%p152 bra BB12_300; | |
st.local.v2.u32 [%rd2+592], {%r15946, %r1204}; | |
mov.u32 %r14121, %r15946; | |
mov.u32 %r15946, %r1204; | |
mov.u32 %r15945, %r14121; | |
BB12_300: | |
mov.u32 %r15941, %r15945; | |
mov.u32 %r15942, %r15946; | |
bfe.u32 %r6371, %r1203, 22, 6; | |
mul.lo.s64 %rd1511, %rd92, 1792; | |
add.s64 %rd1512, %rd415, %rd1511; | |
mul.wide.u32 %rd1513, %r6371, 28; | |
add.s64 %rd1514, %rd1512, %rd1513; | |
ld.global.u32 %r6372, [%rd1514]; | |
and.b32 %r6373, %r6372, 65535; | |
bfe.u32 %r6374, %r6372, 16, 6; | |
mul.wide.u32 %rd1515, %r6373, 1792; | |
add.s64 %rd1516, %rd414, %rd1515; | |
mul.wide.u32 %rd1517, %r6374, 28; | |
add.s64 %rd1518, %rd1516, %rd1517; | |
ld.global.u32 %r6375, [%rd1518]; | |
and.b32 %r6376, %r6375, 65535; | |
shl.b32 %r6377, %r6376, 6; | |
bfe.u32 %r6378, %r6375, 16, 6; | |
or.b32 %r1208, %r6377, %r6378; | |
st.local.u32 [%rd2+600], %r1208; | |
bfe.u32 %r6379, %r6372, 22, 6; | |
mul.wide.u32 %rd1519, %r6379, 28; | |
add.s64 %rd1520, %rd1516, %rd1519; | |
ld.global.u32 %r6380, [%rd1520]; | |
and.b32 %r6381, %r6380, 65535; | |
shl.b32 %r6382, %r6381, 6; | |
bfe.u32 %r6383, %r6380, 16, 6; | |
or.b32 %r15948, %r6382, %r6383; | |
st.local.u32 [%rd2+604], %r15948; | |
setp.le.u32 %p153, %r1208, %r15948; | |
mov.u32 %r15947, %r1208; | |
@%p153 bra BB12_302; | |
st.local.v2.u32 [%rd2+600], {%r15948, %r1208}; | |
mov.u32 %r14127, %r15948; | |
mov.u32 %r15948, %r1208; | |
mov.u32 %r15947, %r14127; | |
BB12_302: | |
mov.u32 %r1211, %r15947; | |
mov.u32 %r1210, %r15948; | |
setp.le.u32 %p154, %r15941, %r1211; | |
mov.u32 %r15943, %r1211; | |
mov.u32 %r15944, %r1210; | |
@%p154 bra BB12_304; | |
st.local.v4.u32 [%rd2+592], {%r1211, %r1210, %r15941, %r15942}; | |
mov.u32 %r14124, %r15942; | |
mov.u32 %r14126, %r15941; | |
mov.u32 %r15942, %r1210; | |
mov.u32 %r15941, %r1211; | |
mov.u32 %r15943, %r14126; | |
mov.u32 %r15944, %r14124; | |
BB12_304: | |
mov.u32 %r1215, %r15941; | |
mov.u32 %r1214, %r15942; | |
mov.u32 %r1213, %r15943; | |
mov.u32 %r1212, %r15944; | |
setp.le.u32 %p155, %r15925, %r1215; | |
mov.u32 %r15929, %r1215; | |
mov.u32 %r15930, %r1214; | |
mov.u32 %r15931, %r1213; | |
mov.u32 %r15932, %r1212; | |
@%p155 bra BB12_306; | |
st.local.v4.u32 [%rd2+576], {%r1215, %r1214, %r1213, %r1212}; | |
st.local.v4.u32 [%rd2+592], {%r15925, %r15926, %r15927, %r15928}; | |
mov.u32 %r14114, %r15928; | |
mov.u32 %r14116, %r15927; | |
mov.u32 %r14118, %r15926; | |
mov.u32 %r14120, %r15925; | |
mov.u32 %r15928, %r1212; | |
mov.u32 %r15927, %r1213; | |
mov.u32 %r15926, %r1214; | |
mov.u32 %r15925, %r1215; | |
mov.u32 %r15929, %r14120; | |
mov.u32 %r15930, %r14118; | |
mov.u32 %r15931, %r14116; | |
mov.u32 %r15932, %r14114; | |
BB12_306: | |
mov.u32 %r15909, %r15925; | |
mov.u32 %r15910, %r15926; | |
mov.u32 %r15911, %r15927; | |
mov.u32 %r15912, %r15928; | |
mov.u32 %r15913, %r15929; | |
mov.u32 %r15914, %r15930; | |
mov.u32 %r15915, %r15931; | |
mov.u32 %r15916, %r15932; | |
mul.lo.s64 %rd1521, %rd89, 1792; | |
add.s64 %rd1522, %rd6, %rd1521; | |
bfe.u32 %r6384, %r1188, 22, 6; | |
mul.wide.u32 %rd1523, %r6384, 28; | |
add.s64 %rd1524, %rd1522, %rd1523; | |
ld.global.u32 %r1224, [%rd1524+-8]; | |
and.b32 %r6385, %r1224, 65535; | |
mul.wide.u32 %rd1525, %r6385, 1792; | |
add.s64 %rd1526, %rd4, %rd1525; | |
cvt.u64.u32 %rd93, %r6385; | |
bfe.u32 %r6386, %r1224, 16, 6; | |
mul.wide.u32 %rd1527, %r6386, 28; | |
add.s64 %rd1528, %rd1526, %rd1527; | |
ld.global.u32 %r1225, [%rd1528+-12]; | |
and.b32 %r6387, %r1225, 65535; | |
cvt.u64.u32 %rd94, %r6387; | |
bfe.u32 %r6388, %r1225, 16, 6; | |
mul.wide.u32 %rd1529, %r6387, 1792; | |
add.s64 %rd1530, %rd415, %rd1529; | |
mul.wide.u32 %rd1531, %r6388, 28; | |
add.s64 %rd1532, %rd1530, %rd1531; | |
ld.global.u32 %r6389, [%rd1532]; | |
and.b32 %r6390, %r6389, 65535; | |
bfe.u32 %r6391, %r6389, 16, 6; | |
mul.wide.u32 %rd1533, %r6390, 1792; | |
add.s64 %rd1534, %rd414, %rd1533; | |
mul.wide.u32 %rd1535, %r6391, 28; | |
add.s64 %rd1536, %rd1534, %rd1535; | |
ld.global.u32 %r6392, [%rd1536]; | |
and.b32 %r6393, %r6392, 65535; | |
shl.b32 %r6394, %r6393, 6; | |
bfe.u32 %r6395, %r6392, 16, 6; | |
or.b32 %r1226, %r6394, %r6395; | |
st.local.u32 [%rd2+608], %r1226; | |
bfe.u32 %r6396, %r6389, 22, 6; | |
mul.wide.u32 %rd1537, %r6396, 28; | |
add.s64 %rd1538, %rd1534, %rd1537; | |
ld.global.u32 %r6397, [%rd1538]; | |
and.b32 %r6398, %r6397, 65535; | |
shl.b32 %r6399, %r6398, 6; | |
bfe.u32 %r6400, %r6397, 16, 6; | |
or.b32 %r15962, %r6399, %r6400; | |
st.local.u32 [%rd2+612], %r15962; | |
setp.le.u32 %p156, %r1226, %r15962; | |
mov.u32 %r15961, %r1226; | |
@%p156 bra BB12_308; | |
st.local.v2.u32 [%rd2+608], {%r15962, %r1226}; | |
mov.u32 %r14157, %r15962; | |
mov.u32 %r15962, %r1226; | |
mov.u32 %r15961, %r14157; | |
BB12_308: | |
mov.u32 %r15957, %r15961; | |
mov.u32 %r15958, %r15962; | |
bfe.u32 %r6401, %r1225, 22, 6; | |
mul.lo.s64 %rd1539, %rd94, 1792; | |
add.s64 %rd1540, %rd415, %rd1539; | |
mul.wide.u32 %rd1541, %r6401, 28; | |
add.s64 %rd1542, %rd1540, %rd1541; | |
ld.global.u32 %r6402, [%rd1542]; | |
and.b32 %r6403, %r6402, 65535; | |
bfe.u32 %r6404, %r6402, 16, 6; | |
mul.wide.u32 %rd1543, %r6403, 1792; | |
add.s64 %rd1544, %rd414, %rd1543; | |
mul.wide.u32 %rd1545, %r6404, 28; | |
add.s64 %rd1546, %rd1544, %rd1545; | |
ld.global.u32 %r6405, [%rd1546]; | |
and.b32 %r6406, %r6405, 65535; | |
shl.b32 %r6407, %r6406, 6; | |
bfe.u32 %r6408, %r6405, 16, 6; | |
or.b32 %r1230, %r6407, %r6408; | |
st.local.u32 [%rd2+616], %r1230; | |
bfe.u32 %r6409, %r6402, 22, 6; | |
mul.wide.u32 %rd1547, %r6409, 28; | |
add.s64 %rd1548, %rd1544, %rd1547; | |
ld.global.u32 %r6410, [%rd1548]; | |
and.b32 %r6411, %r6410, 65535; | |
shl.b32 %r6412, %r6411, 6; | |
bfe.u32 %r6413, %r6410, 16, 6; | |
or.b32 %r15964, %r6412, %r6413; | |
st.local.u32 [%rd2+620], %r15964; | |
setp.le.u32 %p157, %r1230, %r15964; | |
mov.u32 %r15963, %r1230; | |
@%p157 bra BB12_310; | |
st.local.v2.u32 [%rd2+616], {%r15964, %r1230}; | |
mov.u32 %r14163, %r15964; | |
mov.u32 %r15964, %r1230; | |
mov.u32 %r15963, %r14163; | |
BB12_310: | |
mov.u32 %r1233, %r15963; | |
mov.u32 %r1232, %r15964; | |
setp.le.u32 %p158, %r15957, %r1233; | |
mov.u32 %r15959, %r1233; | |
mov.u32 %r15960, %r1232; | |
@%p158 bra BB12_312; | |
st.local.v4.u32 [%rd2+608], {%r1233, %r1232, %r15957, %r15958}; | |
mov.u32 %r14160, %r15958; | |
mov.u32 %r14162, %r15957; | |
mov.u32 %r15958, %r1232; | |
mov.u32 %r15957, %r1233; | |
mov.u32 %r15959, %r14162; | |
mov.u32 %r15960, %r14160; | |
BB12_312: | |
mov.u32 %r15949, %r15957; | |
mov.u32 %r15950, %r15958; | |
mov.u32 %r15951, %r15959; | |
mov.u32 %r15952, %r15960; | |
mul.lo.s64 %rd1549, %rd93, 1792; | |
add.s64 %rd1550, %rd4, %rd1549; | |
bfe.u32 %r6414, %r1224, 22, 6; | |
mul.wide.u32 %rd1551, %r6414, 28; | |
add.s64 %rd1552, %rd1550, %rd1551; | |
ld.global.u32 %r1238, [%rd1552+-12]; | |
and.b32 %r6415, %r1238, 65535; | |
cvt.u64.u32 %rd95, %r6415; | |
bfe.u32 %r6416, %r1238, 16, 6; | |
mul.wide.u32 %rd1553, %r6415, 1792; | |
add.s64 %rd1554, %rd415, %rd1553; | |
mul.wide.u32 %rd1555, %r6416, 28; | |
add.s64 %rd1556, %rd1554, %rd1555; | |
ld.global.u32 %r6417, [%rd1556]; | |
and.b32 %r6418, %r6417, 65535; | |
bfe.u32 %r6419, %r6417, 16, 6; | |
mul.wide.u32 %rd1557, %r6418, 1792; | |
add.s64 %rd1558, %rd414, %rd1557; | |
mul.wide.u32 %rd1559, %r6419, 28; | |
add.s64 %rd1560, %rd1558, %rd1559; | |
ld.global.u32 %r6420, [%rd1560]; | |
and.b32 %r6421, %r6420, 65535; | |
shl.b32 %r6422, %r6421, 6; | |
bfe.u32 %r6423, %r6420, 16, 6; | |
or.b32 %r1239, %r6422, %r6423; | |
st.local.u32 [%rd2+624], %r1239; | |
bfe.u32 %r6424, %r6417, 22, 6; | |
mul.wide.u32 %rd1561, %r6424, 28; | |
add.s64 %rd1562, %rd1558, %rd1561; | |
ld.global.u32 %r6425, [%rd1562]; | |
and.b32 %r6426, %r6425, 65535; | |
shl.b32 %r6427, %r6426, 6; | |
bfe.u32 %r6428, %r6425, 16, 6; | |
or.b32 %r15970, %r6427, %r6428; | |
st.local.u32 [%rd2+628], %r15970; | |
setp.le.u32 %p159, %r1239, %r15970; | |
mov.u32 %r15969, %r1239; | |
@%p159 bra BB12_314; | |
st.local.v2.u32 [%rd2+624], {%r15970, %r1239}; | |
mov.u32 %r14177, %r15970; | |
mov.u32 %r15970, %r1239; | |
mov.u32 %r15969, %r14177; | |
BB12_314: | |
mov.u32 %r15965, %r15969; | |
mov.u32 %r15966, %r15970; | |
bfe.u32 %r6429, %r1238, 22, 6; | |
mul.lo.s64 %rd1563, %rd95, 1792; | |
add.s64 %rd1564, %rd415, %rd1563; | |
mul.wide.u32 %rd1565, %r6429, 28; | |
add.s64 %rd1566, %rd1564, %rd1565; | |
ld.global.u32 %r6430, [%rd1566]; | |
and.b32 %r6431, %r6430, 65535; | |
bfe.u32 %r6432, %r6430, 16, 6; | |
mul.wide.u32 %rd1567, %r6431, 1792; | |
add.s64 %rd1568, %rd414, %rd1567; | |
mul.wide.u32 %rd1569, %r6432, 28; | |
add.s64 %rd1570, %rd1568, %rd1569; | |
ld.global.u32 %r6433, [%rd1570]; | |
and.b32 %r6434, %r6433, 65535; | |
shl.b32 %r6435, %r6434, 6; | |
bfe.u32 %r6436, %r6433, 16, 6; | |
or.b32 %r1243, %r6435, %r6436; | |
st.local.u32 [%rd2+632], %r1243; | |
bfe.u32 %r6437, %r6430, 22, 6; | |
mul.wide.u32 %rd1571, %r6437, 28; | |
add.s64 %rd1572, %rd1568, %rd1571; | |
ld.global.u32 %r6438, [%rd1572]; | |
and.b32 %r6439, %r6438, 65535; | |
shl.b32 %r6440, %r6439, 6; | |
bfe.u32 %r6441, %r6438, 16, 6; | |
or.b32 %r15972, %r6440, %r6441; | |
st.local.u32 [%rd2+636], %r15972; | |
setp.le.u32 %p160, %r1243, %r15972; | |
mov.u32 %r15971, %r1243; | |
@%p160 bra BB12_316; | |
st.local.v2.u32 [%rd2+632], {%r15972, %r1243}; | |
mov.u32 %r14183, %r15972; | |
mov.u32 %r15972, %r1243; | |
mov.u32 %r15971, %r14183; | |
BB12_316: | |
mov.u32 %r1246, %r15971; | |
mov.u32 %r1245, %r15972; | |
setp.le.u32 %p161, %r15965, %r1246; | |
mov.u32 %r15967, %r1246; | |
mov.u32 %r15968, %r1245; | |
@%p161 bra BB12_318; | |
st.local.v4.u32 [%rd2+624], {%r1246, %r1245, %r15965, %r15966}; | |
mov.u32 %r14180, %r15966; | |
mov.u32 %r14182, %r15965; | |
mov.u32 %r15966, %r1245; | |
mov.u32 %r15965, %r1246; | |
mov.u32 %r15967, %r14182; | |
mov.u32 %r15968, %r14180; | |
BB12_318: | |
mov.u32 %r1250, %r15965; | |
mov.u32 %r1249, %r15966; | |
mov.u32 %r1248, %r15967; | |
mov.u32 %r1247, %r15968; | |
setp.le.u32 %p162, %r15949, %r1250; | |
mov.u32 %r15953, %r1250; | |
mov.u32 %r15954, %r1249; | |
mov.u32 %r15955, %r1248; | |
mov.u32 %r15956, %r1247; | |
@%p162 bra BB12_320; | |
st.local.v4.u32 [%rd2+608], {%r1250, %r1249, %r1248, %r1247}; | |
st.local.v4.u32 [%rd2+624], {%r15949, %r15950, %r15951, %r15952}; | |
mov.u32 %r14170, %r15952; | |
mov.u32 %r14172, %r15951; | |
mov.u32 %r14174, %r15950; | |
mov.u32 %r14176, %r15949; | |
mov.u32 %r15952, %r1247; | |
mov.u32 %r15951, %r1248; | |
mov.u32 %r15950, %r1249; | |
mov.u32 %r15949, %r1250; | |
mov.u32 %r15953, %r14176; | |
mov.u32 %r15954, %r14174; | |
mov.u32 %r15955, %r14172; | |
mov.u32 %r15956, %r14170; | |
BB12_320: | |
mov.u32 %r1258, %r15949; | |
mov.u32 %r1257, %r15950; | |
mov.u32 %r1256, %r15951; | |
mov.u32 %r1255, %r15952; | |
mov.u32 %r1254, %r15953; | |
mov.u32 %r1253, %r15954; | |
mov.u32 %r1252, %r15955; | |
mov.u32 %r1251, %r15956; | |
setp.le.u32 %p163, %r15909, %r1258; | |
mov.u32 %r15917, %r1258; | |
mov.u32 %r15918, %r1257; | |
mov.u32 %r15919, %r1256; | |
mov.u32 %r15920, %r1255; | |
mov.u32 %r15921, %r1254; | |
mov.u32 %r15922, %r1253; | |
mov.u32 %r15923, %r1252; | |
mov.u32 %r15924, %r1251; | |
@%p163 bra BB12_322; | |
st.local.v4.u32 [%rd2+576], {%r1258, %r1257, %r1256, %r1255}; | |
st.local.v4.u32 [%rd2+608], {%r15909, %r15910, %r15911, %r15912}; | |
st.local.v4.u32 [%rd2+592], {%r1254, %r1253, %r1252, %r1251}; | |
st.local.v4.u32 [%rd2+624], {%r15913, %r15914, %r15915, %r15916}; | |
mov.u32 %r14142, %r15916; | |
mov.u32 %r14144, %r15915; | |
mov.u32 %r14146, %r15914; | |
mov.u32 %r14148, %r15913; | |
mov.u32 %r14150, %r15912; | |
mov.u32 %r14152, %r15911; | |
mov.u32 %r14154, %r15910; | |
mov.u32 %r14156, %r15909; | |
mov.u32 %r15916, %r1251; | |
mov.u32 %r15915, %r1252; | |
mov.u32 %r15914, %r1253; | |
mov.u32 %r15913, %r1254; | |
mov.u32 %r15912, %r1255; | |
mov.u32 %r15911, %r1256; | |
mov.u32 %r15910, %r1257; | |
mov.u32 %r15909, %r1258; | |
mov.u32 %r15917, %r14156; | |
mov.u32 %r15918, %r14154; | |
mov.u32 %r15919, %r14152; | |
mov.u32 %r15920, %r14150; | |
mov.u32 %r15921, %r14148; | |
mov.u32 %r15922, %r14146; | |
mov.u32 %r15923, %r14144; | |
mov.u32 %r15924, %r14142; | |
BB12_322: | |
mov.u32 %r1274, %r15909; | |
mov.u32 %r1273, %r15910; | |
mov.u32 %r1272, %r15911; | |
mov.u32 %r1271, %r15912; | |
mov.u32 %r1270, %r15913; | |
mov.u32 %r1269, %r15914; | |
mov.u32 %r1268, %r15915; | |
mov.u32 %r1267, %r15916; | |
mov.u32 %r1266, %r15917; | |
mov.u32 %r1265, %r15918; | |
mov.u32 %r1264, %r15919; | |
mov.u32 %r1263, %r15920; | |
mov.u32 %r1262, %r15921; | |
mov.u32 %r1261, %r15922; | |
mov.u32 %r1260, %r15923; | |
mov.u32 %r1259, %r15924; | |
setp.le.u32 %p164, %r15813, %r1274; | |
mov.u32 %r15829, %r1274; | |
mov.u32 %r15830, %r1273; | |
mov.u32 %r15831, %r1272; | |
mov.u32 %r15832, %r1271; | |
mov.u32 %r15833, %r1270; | |
mov.u32 %r15834, %r1269; | |
mov.u32 %r15835, %r1268; | |
mov.u32 %r15836, %r1267; | |
mov.u32 %r15837, %r1266; | |
mov.u32 %r15838, %r1265; | |
mov.u32 %r15839, %r1264; | |
mov.u32 %r15840, %r1263; | |
mov.u32 %r15841, %r1262; | |
mov.u32 %r15842, %r1261; | |
mov.u32 %r15843, %r1260; | |
mov.u32 %r15844, %r1259; | |
@%p164 bra BB12_324; | |
st.local.v4.u32 [%rd2+512], {%r1274, %r1273, %r1272, %r1271}; | |
st.local.v4.u32 [%rd2+576], {%r15813, %r15814, %r15815, %r15816}; | |
st.local.v4.u32 [%rd2+528], {%r1270, %r1269, %r1268, %r1267}; | |
st.local.v4.u32 [%rd2+592], {%r15817, %r15818, %r15819, %r15820}; | |
st.local.v4.u32 [%rd2+544], {%r1266, %r1265, %r1264, %r1263}; | |
st.local.v4.u32 [%rd2+608], {%r15821, %r15822, %r15823, %r15824}; | |
st.local.v4.u32 [%rd2+560], {%r1262, %r1261, %r1260, %r1259}; | |
st.local.v4.u32 [%rd2+624], {%r15825, %r15826, %r15827, %r15828}; | |
mov.u32 %r14070, %r15828; | |
mov.u32 %r14072, %r15827; | |
mov.u32 %r14074, %r15826; | |
mov.u32 %r14076, %r15825; | |
mov.u32 %r14078, %r15824; | |
mov.u32 %r14080, %r15823; | |
mov.u32 %r14082, %r15822; | |
mov.u32 %r14084, %r15821; | |
mov.u32 %r14086, %r15820; | |
mov.u32 %r14088, %r15819; | |
mov.u32 %r14090, %r15818; | |
mov.u32 %r14092, %r15817; | |
mov.u32 %r14094, %r15816; | |
mov.u32 %r14096, %r15815; | |
mov.u32 %r14098, %r15814; | |
mov.u32 %r14100, %r15813; | |
mov.u32 %r15828, %r1259; | |
mov.u32 %r15827, %r1260; | |
mov.u32 %r15826, %r1261; | |
mov.u32 %r15825, %r1262; | |
mov.u32 %r15824, %r1263; | |
mov.u32 %r15823, %r1264; | |
mov.u32 %r15822, %r1265; | |
mov.u32 %r15821, %r1266; | |
mov.u32 %r15820, %r1267; | |
mov.u32 %r15819, %r1268; | |
mov.u32 %r15818, %r1269; | |
mov.u32 %r15817, %r1270; | |
mov.u32 %r15816, %r1271; | |
mov.u32 %r15815, %r1272; | |
mov.u32 %r15814, %r1273; | |
mov.u32 %r15813, %r1274; | |
mov.u32 %r15829, %r14100; | |
mov.u32 %r15830, %r14098; | |
mov.u32 %r15831, %r14096; | |
mov.u32 %r15832, %r14094; | |
mov.u32 %r15833, %r14092; | |
mov.u32 %r15834, %r14090; | |
mov.u32 %r15835, %r14088; | |
mov.u32 %r15836, %r14086; | |
mov.u32 %r15837, %r14084; | |
mov.u32 %r15838, %r14082; | |
mov.u32 %r15839, %r14080; | |
mov.u32 %r15840, %r14078; | |
mov.u32 %r15841, %r14076; | |
mov.u32 %r15842, %r14074; | |
mov.u32 %r15843, %r14072; | |
mov.u32 %r15844, %r14070; | |
BB12_324: | |
mov.u32 %r15749, %r15813; | |
mov.u32 %r15750, %r15814; | |
mov.u32 %r15751, %r15815; | |
mov.u32 %r15752, %r15816; | |
mov.u32 %r15753, %r15817; | |
mov.u32 %r15754, %r15818; | |
mov.u32 %r15755, %r15819; | |
mov.u32 %r15756, %r15820; | |
mov.u32 %r15757, %r15821; | |
mov.u32 %r15758, %r15822; | |
mov.u32 %r15759, %r15823; | |
mov.u32 %r15760, %r15824; | |
mov.u32 %r15761, %r15825; | |
mov.u32 %r15762, %r15826; | |
mov.u32 %r15763, %r15827; | |
mov.u32 %r15764, %r15828; | |
mov.u32 %r15765, %r15829; | |
mov.u32 %r15766, %r15830; | |
mov.u32 %r15767, %r15831; | |
mov.u32 %r15768, %r15832; | |
mov.u32 %r15769, %r15833; | |
mov.u32 %r15770, %r15834; | |
mov.u32 %r15771, %r15835; | |
mov.u32 %r15772, %r15836; | |
mov.u32 %r15773, %r15837; | |
mov.u32 %r15774, %r15838; | |
mov.u32 %r15775, %r15839; | |
mov.u32 %r15776, %r15840; | |
mov.u32 %r15777, %r15841; | |
mov.u32 %r15778, %r15842; | |
mov.u32 %r15779, %r15843; | |
mov.u32 %r15780, %r15844; | |
mul.lo.s64 %rd1573, %rd80, 1792; | |
add.s64 %rd1574, %rd6, %rd1573; | |
bfe.u32 %r6442, %r1099, 22, 6; | |
mul.wide.u32 %rd1575, %r6442, 28; | |
add.s64 %rd1576, %rd1574, %rd1575; | |
ld.global.u32 %r1307, [%rd1576+-4]; | |
and.b32 %r6443, %r1307, 65535; | |
mul.wide.u32 %rd1577, %r6443, 1792; | |
add.s64 %rd1578, %rd4, %rd1577; | |
bfe.u32 %r6444, %r1307, 16, 6; | |
mul.wide.u32 %rd1579, %r6444, 28; | |
add.s64 %rd1580, %rd1578, %rd1579; | |
ld.global.u32 %r1308, [%rd1580+-8]; | |
and.b32 %r6445, %r1308, 65535; | |
mul.wide.u32 %rd1581, %r6445, 1792; | |
add.s64 %rd1582, %rd6, %rd1581; | |
bfe.u32 %r6446, %r1308, 16, 6; | |
mul.wide.u32 %rd1583, %r6446, 28; | |
add.s64 %rd1584, %rd1582, %rd1583; | |
ld.global.u32 %r1309, [%rd1584+-8]; | |
and.b32 %r6447, %r1309, 65535; | |
mul.wide.u32 %rd1585, %r6447, 1792; | |
add.s64 %rd1586, %rd4, %rd1585; | |
cvt.u64.u32 %rd96, %r6443; | |
cvt.u64.u32 %rd97, %r6445; | |
cvt.u64.u32 %rd98, %r6447; | |
bfe.u32 %r6448, %r1309, 16, 6; | |
mul.wide.u32 %rd1587, %r6448, 28; | |
add.s64 %rd1588, %rd1586, %rd1587; | |
ld.global.u32 %r1310, [%rd1588+-12]; | |
and.b32 %r6449, %r1310, 65535; | |
cvt.u64.u32 %rd99, %r6449; | |
bfe.u32 %r6450, %r1310, 16, 6; | |
mul.wide.u32 %rd1589, %r6449, 1792; | |
add.s64 %rd1590, %rd415, %rd1589; | |
mul.wide.u32 %rd1591, %r6450, 28; | |
add.s64 %rd1592, %rd1590, %rd1591; | |
ld.global.u32 %r6451, [%rd1592]; | |
and.b32 %r6452, %r6451, 65535; | |
bfe.u32 %r6453, %r6451, 16, 6; | |
mul.wide.u32 %rd1593, %r6452, 1792; | |
add.s64 %rd1594, %rd414, %rd1593; | |
mul.wide.u32 %rd1595, %r6453, 28; | |
add.s64 %rd1596, %rd1594, %rd1595; | |
ld.global.u32 %r6454, [%rd1596]; | |
and.b32 %r6455, %r6454, 65535; | |
shl.b32 %r6456, %r6455, 6; | |
bfe.u32 %r6457, %r6454, 16, 6; | |
or.b32 %r1311, %r6456, %r6457; | |
st.local.u32 [%rd2+640], %r1311; | |
bfe.u32 %r6458, %r6451, 22, 6; | |
mul.wide.u32 %rd1597, %r6458, 28; | |
add.s64 %rd1598, %rd1594, %rd1597; | |
ld.global.u32 %r6459, [%rd1598]; | |
and.b32 %r6460, %r6459, 65535; | |
shl.b32 %r6461, %r6460, 6; | |
bfe.u32 %r6462, %r6459, 16, 6; | |
or.b32 %r16034, %r6461, %r6462; | |
st.local.u32 [%rd2+644], %r16034; | |
setp.le.u32 %p165, %r1311, %r16034; | |
mov.u32 %r16033, %r1311; | |
@%p165 bra BB12_326; | |
st.local.v2.u32 [%rd2+640], {%r16034, %r1311}; | |
mov.u32 %r14309, %r16034; | |
mov.u32 %r16034, %r1311; | |
mov.u32 %r16033, %r14309; | |
BB12_326: | |
mov.u32 %r16029, %r16033; | |
mov.u32 %r16030, %r16034; | |
bfe.u32 %r6463, %r1310, 22, 6; | |
mul.lo.s64 %rd1599, %rd99, 1792; | |
add.s64 %rd1600, %rd415, %rd1599; | |
mul.wide.u32 %rd1601, %r6463, 28; | |
add.s64 %rd1602, %rd1600, %rd1601; | |
ld.global.u32 %r6464, [%rd1602]; | |
and.b32 %r6465, %r6464, 65535; | |
bfe.u32 %r6466, %r6464, 16, 6; | |
mul.wide.u32 %rd1603, %r6465, 1792; | |
add.s64 %rd1604, %rd414, %rd1603; | |
mul.wide.u32 %rd1605, %r6466, 28; | |
add.s64 %rd1606, %rd1604, %rd1605; | |
ld.global.u32 %r6467, [%rd1606]; | |
and.b32 %r6468, %r6467, 65535; | |
shl.b32 %r6469, %r6468, 6; | |
bfe.u32 %r6470, %r6467, 16, 6; | |
or.b32 %r1315, %r6469, %r6470; | |
st.local.u32 [%rd2+648], %r1315; | |
bfe.u32 %r6471, %r6464, 22, 6; | |
mul.wide.u32 %rd1607, %r6471, 28; | |
add.s64 %rd1608, %rd1604, %rd1607; | |
ld.global.u32 %r6472, [%rd1608]; | |
and.b32 %r6473, %r6472, 65535; | |
shl.b32 %r6474, %r6473, 6; | |
bfe.u32 %r6475, %r6472, 16, 6; | |
or.b32 %r16036, %r6474, %r6475; | |
st.local.u32 [%rd2+652], %r16036; | |
setp.le.u32 %p166, %r1315, %r16036; | |
mov.u32 %r16035, %r1315; | |
@%p166 bra BB12_328; | |
st.local.v2.u32 [%rd2+648], {%r16036, %r1315}; | |
mov.u32 %r14315, %r16036; | |
mov.u32 %r16036, %r1315; | |
mov.u32 %r16035, %r14315; | |
BB12_328: | |
mov.u32 %r1318, %r16035; | |
mov.u32 %r1317, %r16036; | |
setp.le.u32 %p167, %r16029, %r1318; | |
mov.u32 %r16031, %r1318; | |
mov.u32 %r16032, %r1317; | |
@%p167 bra BB12_330; | |
st.local.v4.u32 [%rd2+640], {%r1318, %r1317, %r16029, %r16030}; | |
mov.u32 %r14312, %r16030; | |
mov.u32 %r14314, %r16029; | |
mov.u32 %r16030, %r1317; | |
mov.u32 %r16029, %r1318; | |
mov.u32 %r16031, %r14314; | |
mov.u32 %r16032, %r14312; | |
BB12_330: | |
mov.u32 %r16021, %r16029; | |
mov.u32 %r16022, %r16030; | |
mov.u32 %r16023, %r16031; | |
mov.u32 %r16024, %r16032; | |
mul.lo.s64 %rd1609, %rd98, 1792; | |
add.s64 %rd1610, %rd4, %rd1609; | |
bfe.u32 %r6476, %r1309, 22, 6; | |
mul.wide.u32 %rd1611, %r6476, 28; | |
add.s64 %rd1612, %rd1610, %rd1611; | |
ld.global.u32 %r1323, [%rd1612+-12]; | |
and.b32 %r6477, %r1323, 65535; | |
cvt.u64.u32 %rd100, %r6477; | |
bfe.u32 %r6478, %r1323, 16, 6; | |
mul.wide.u32 %rd1613, %r6477, 1792; | |
add.s64 %rd1614, %rd415, %rd1613; | |
mul.wide.u32 %rd1615, %r6478, 28; | |
add.s64 %rd1616, %rd1614, %rd1615; | |
ld.global.u32 %r6479, [%rd1616]; | |
and.b32 %r6480, %r6479, 65535; | |
bfe.u32 %r6481, %r6479, 16, 6; | |
mul.wide.u32 %rd1617, %r6480, 1792; | |
add.s64 %rd1618, %rd414, %rd1617; | |
mul.wide.u32 %rd1619, %r6481, 28; | |
add.s64 %rd1620, %rd1618, %rd1619; | |
ld.global.u32 %r6482, [%rd1620]; | |
and.b32 %r6483, %r6482, 65535; | |
shl.b32 %r6484, %r6483, 6; | |
bfe.u32 %r6485, %r6482, 16, 6; | |
or.b32 %r1324, %r6484, %r6485; | |
st.local.u32 [%rd2+656], %r1324; | |
bfe.u32 %r6486, %r6479, 22, 6; | |
mul.wide.u32 %rd1621, %r6486, 28; | |
add.s64 %rd1622, %rd1618, %rd1621; | |
ld.global.u32 %r6487, [%rd1622]; | |
and.b32 %r6488, %r6487, 65535; | |
shl.b32 %r6489, %r6488, 6; | |
bfe.u32 %r6490, %r6487, 16, 6; | |
or.b32 %r16042, %r6489, %r6490; | |
st.local.u32 [%rd2+660], %r16042; | |
setp.le.u32 %p168, %r1324, %r16042; | |
mov.u32 %r16041, %r1324; | |
@%p168 bra BB12_332; | |
st.local.v2.u32 [%rd2+656], {%r16042, %r1324}; | |
mov.u32 %r14329, %r16042; | |
mov.u32 %r16042, %r1324; | |
mov.u32 %r16041, %r14329; | |
BB12_332: | |
mov.u32 %r16037, %r16041; | |
mov.u32 %r16038, %r16042; | |
bfe.u32 %r6491, %r1323, 22, 6; | |
mul.lo.s64 %rd1623, %rd100, 1792; | |
add.s64 %rd1624, %rd415, %rd1623; | |
mul.wide.u32 %rd1625, %r6491, 28; | |
add.s64 %rd1626, %rd1624, %rd1625; | |
ld.global.u32 %r6492, [%rd1626]; | |
and.b32 %r6493, %r6492, 65535; | |
bfe.u32 %r6494, %r6492, 16, 6; | |
mul.wide.u32 %rd1627, %r6493, 1792; | |
add.s64 %rd1628, %rd414, %rd1627; | |
mul.wide.u32 %rd1629, %r6494, 28; | |
add.s64 %rd1630, %rd1628, %rd1629; | |
ld.global.u32 %r6495, [%rd1630]; | |
and.b32 %r6496, %r6495, 65535; | |
shl.b32 %r6497, %r6496, 6; | |
bfe.u32 %r6498, %r6495, 16, 6; | |
or.b32 %r1328, %r6497, %r6498; | |
st.local.u32 [%rd2+664], %r1328; | |
bfe.u32 %r6499, %r6492, 22, 6; | |
mul.wide.u32 %rd1631, %r6499, 28; | |
add.s64 %rd1632, %rd1628, %rd1631; | |
ld.global.u32 %r6500, [%rd1632]; | |
and.b32 %r6501, %r6500, 65535; | |
shl.b32 %r6502, %r6501, 6; | |
bfe.u32 %r6503, %r6500, 16, 6; | |
or.b32 %r16044, %r6502, %r6503; | |
st.local.u32 [%rd2+668], %r16044; | |
setp.le.u32 %p169, %r1328, %r16044; | |
mov.u32 %r16043, %r1328; | |
@%p169 bra BB12_334; | |
st.local.v2.u32 [%rd2+664], {%r16044, %r1328}; | |
mov.u32 %r14335, %r16044; | |
mov.u32 %r16044, %r1328; | |
mov.u32 %r16043, %r14335; | |
BB12_334: | |
mov.u32 %r1331, %r16043; | |
mov.u32 %r1330, %r16044; | |
setp.le.u32 %p170, %r16037, %r1331; | |
mov.u32 %r16039, %r1331; | |
mov.u32 %r16040, %r1330; | |
@%p170 bra BB12_336; | |
st.local.v4.u32 [%rd2+656], {%r1331, %r1330, %r16037, %r16038}; | |
mov.u32 %r14332, %r16038; | |
mov.u32 %r14334, %r16037; | |
mov.u32 %r16038, %r1330; | |
mov.u32 %r16037, %r1331; | |
mov.u32 %r16039, %r14334; | |
mov.u32 %r16040, %r14332; | |
BB12_336: | |
mov.u32 %r1335, %r16037; | |
mov.u32 %r1334, %r16038; | |
mov.u32 %r1333, %r16039; | |
mov.u32 %r1332, %r16040; | |
setp.le.u32 %p171, %r16021, %r1335; | |
mov.u32 %r16025, %r1335; | |
mov.u32 %r16026, %r1334; | |
mov.u32 %r16027, %r1333; | |
mov.u32 %r16028, %r1332; | |
@%p171 bra BB12_338; | |
st.local.v4.u32 [%rd2+640], {%r1335, %r1334, %r1333, %r1332}; | |
st.local.v4.u32 [%rd2+656], {%r16021, %r16022, %r16023, %r16024}; | |
mov.u32 %r14322, %r16024; | |
mov.u32 %r14324, %r16023; | |
mov.u32 %r14326, %r16022; | |
mov.u32 %r14328, %r16021; | |
mov.u32 %r16024, %r1332; | |
mov.u32 %r16023, %r1333; | |
mov.u32 %r16022, %r1334; | |
mov.u32 %r16021, %r1335; | |
mov.u32 %r16025, %r14328; | |
mov.u32 %r16026, %r14326; | |
mov.u32 %r16027, %r14324; | |
mov.u32 %r16028, %r14322; | |
BB12_338: | |
mov.u32 %r16005, %r16021; | |
mov.u32 %r16006, %r16022; | |
mov.u32 %r16007, %r16023; | |
mov.u32 %r16008, %r16024; | |
mov.u32 %r16009, %r16025; | |
mov.u32 %r16010, %r16026; | |
mov.u32 %r16011, %r16027; | |
mov.u32 %r16012, %r16028; | |
mul.lo.s64 %rd1633, %rd97, 1792; | |
add.s64 %rd1634, %rd6, %rd1633; | |
bfe.u32 %r6504, %r1308, 22, 6; | |
mul.wide.u32 %rd1635, %r6504, 28; | |
add.s64 %rd1636, %rd1634, %rd1635; | |
ld.global.u32 %r1344, [%rd1636+-8]; | |
and.b32 %r6505, %r1344, 65535; | |
mul.wide.u32 %rd1637, %r6505, 1792; | |
add.s64 %rd1638, %rd4, %rd1637; | |
cvt.u64.u32 %rd101, %r6505; | |
bfe.u32 %r6506, %r1344, 16, 6; | |
mul.wide.u32 %rd1639, %r6506, 28; | |
add.s64 %rd1640, %rd1638, %rd1639; | |
ld.global.u32 %r1345, [%rd1640+-12]; | |
and.b32 %r6507, %r1345, 65535; | |
cvt.u64.u32 %rd102, %r6507; | |
bfe.u32 %r6508, %r1345, 16, 6; | |
mul.wide.u32 %rd1641, %r6507, 1792; | |
add.s64 %rd1642, %rd415, %rd1641; | |
mul.wide.u32 %rd1643, %r6508, 28; | |
add.s64 %rd1644, %rd1642, %rd1643; | |
ld.global.u32 %r6509, [%rd1644]; | |
and.b32 %r6510, %r6509, 65535; | |
bfe.u32 %r6511, %r6509, 16, 6; | |
mul.wide.u32 %rd1645, %r6510, 1792; | |
add.s64 %rd1646, %rd414, %rd1645; | |
mul.wide.u32 %rd1647, %r6511, 28; | |
add.s64 %rd1648, %rd1646, %rd1647; | |
ld.global.u32 %r6512, [%rd1648]; | |
and.b32 %r6513, %r6512, 65535; | |
shl.b32 %r6514, %r6513, 6; | |
bfe.u32 %r6515, %r6512, 16, 6; | |
or.b32 %r1346, %r6514, %r6515; | |
st.local.u32 [%rd2+672], %r1346; | |
bfe.u32 %r6516, %r6509, 22, 6; | |
mul.wide.u32 %rd1649, %r6516, 28; | |
add.s64 %rd1650, %rd1646, %rd1649; | |
ld.global.u32 %r6517, [%rd1650]; | |
and.b32 %r6518, %r6517, 65535; | |
shl.b32 %r6519, %r6518, 6; | |
bfe.u32 %r6520, %r6517, 16, 6; | |
or.b32 %r16058, %r6519, %r6520; | |
st.local.u32 [%rd2+676], %r16058; | |
setp.le.u32 %p172, %r1346, %r16058; | |
mov.u32 %r16057, %r1346; | |
@%p172 bra BB12_340; | |
st.local.v2.u32 [%rd2+672], {%r16058, %r1346}; | |
mov.u32 %r14365, %r16058; | |
mov.u32 %r16058, %r1346; | |
mov.u32 %r16057, %r14365; | |
BB12_340: | |
mov.u32 %r16053, %r16057; | |
mov.u32 %r16054, %r16058; | |
bfe.u32 %r6521, %r1345, 22, 6; | |
mul.lo.s64 %rd1651, %rd102, 1792; | |
add.s64 %rd1652, %rd415, %rd1651; | |
mul.wide.u32 %rd1653, %r6521, 28; | |
add.s64 %rd1654, %rd1652, %rd1653; | |
ld.global.u32 %r6522, [%rd1654]; | |
and.b32 %r6523, %r6522, 65535; | |
bfe.u32 %r6524, %r6522, 16, 6; | |
mul.wide.u32 %rd1655, %r6523, 1792; | |
add.s64 %rd1656, %rd414, %rd1655; | |
mul.wide.u32 %rd1657, %r6524, 28; | |
add.s64 %rd1658, %rd1656, %rd1657; | |
ld.global.u32 %r6525, [%rd1658]; | |
and.b32 %r6526, %r6525, 65535; | |
shl.b32 %r6527, %r6526, 6; | |
bfe.u32 %r6528, %r6525, 16, 6; | |
or.b32 %r1350, %r6527, %r6528; | |
st.local.u32 [%rd2+680], %r1350; | |
bfe.u32 %r6529, %r6522, 22, 6; | |
mul.wide.u32 %rd1659, %r6529, 28; | |
add.s64 %rd1660, %rd1656, %rd1659; | |
ld.global.u32 %r6530, [%rd1660]; | |
and.b32 %r6531, %r6530, 65535; | |
shl.b32 %r6532, %r6531, 6; | |
bfe.u32 %r6533, %r6530, 16, 6; | |
or.b32 %r16060, %r6532, %r6533; | |
st.local.u32 [%rd2+684], %r16060; | |
setp.le.u32 %p173, %r1350, %r16060; | |
mov.u32 %r16059, %r1350; | |
@%p173 bra BB12_342; | |
st.local.v2.u32 [%rd2+680], {%r16060, %r1350}; | |
mov.u32 %r14371, %r16060; | |
mov.u32 %r16060, %r1350; | |
mov.u32 %r16059, %r14371; | |
BB12_342: | |
mov.u32 %r1353, %r16059; | |
mov.u32 %r1352, %r16060; | |
setp.le.u32 %p174, %r16053, %r1353; | |
mov.u32 %r16055, %r1353; | |
mov.u32 %r16056, %r1352; | |
@%p174 bra BB12_344; | |
st.local.v4.u32 [%rd2+672], {%r1353, %r1352, %r16053, %r16054}; | |
mov.u32 %r14368, %r16054; | |
mov.u32 %r14370, %r16053; | |
mov.u32 %r16054, %r1352; | |
mov.u32 %r16053, %r1353; | |
mov.u32 %r16055, %r14370; | |
mov.u32 %r16056, %r14368; | |
BB12_344: | |
mov.u32 %r16045, %r16053; | |
mov.u32 %r16046, %r16054; | |
mov.u32 %r16047, %r16055; | |
mov.u32 %r16048, %r16056; | |
mul.lo.s64 %rd1661, %rd101, 1792; | |
add.s64 %rd1662, %rd4, %rd1661; | |
bfe.u32 %r6534, %r1344, 22, 6; | |
mul.wide.u32 %rd1663, %r6534, 28; | |
add.s64 %rd1664, %rd1662, %rd1663; | |
ld.global.u32 %r1358, [%rd1664+-12]; | |
and.b32 %r6535, %r1358, 65535; | |
cvt.u64.u32 %rd103, %r6535; | |
bfe.u32 %r6536, %r1358, 16, 6; | |
mul.wide.u32 %rd1665, %r6535, 1792; | |
add.s64 %rd1666, %rd415, %rd1665; | |
mul.wide.u32 %rd1667, %r6536, 28; | |
add.s64 %rd1668, %rd1666, %rd1667; | |
ld.global.u32 %r6537, [%rd1668]; | |
and.b32 %r6538, %r6537, 65535; | |
bfe.u32 %r6539, %r6537, 16, 6; | |
mul.wide.u32 %rd1669, %r6538, 1792; | |
add.s64 %rd1670, %rd414, %rd1669; | |
mul.wide.u32 %rd1671, %r6539, 28; | |
add.s64 %rd1672, %rd1670, %rd1671; | |
ld.global.u32 %r6540, [%rd1672]; | |
and.b32 %r6541, %r6540, 65535; | |
shl.b32 %r6542, %r6541, 6; | |
bfe.u32 %r6543, %r6540, 16, 6; | |
or.b32 %r1359, %r6542, %r6543; | |
st.local.u32 [%rd2+688], %r1359; | |
bfe.u32 %r6544, %r6537, 22, 6; | |
mul.wide.u32 %rd1673, %r6544, 28; | |
add.s64 %rd1674, %rd1670, %rd1673; | |
ld.global.u32 %r6545, [%rd1674]; | |
and.b32 %r6546, %r6545, 65535; | |
shl.b32 %r6547, %r6546, 6; | |
bfe.u32 %r6548, %r6545, 16, 6; | |
or.b32 %r16066, %r6547, %r6548; | |
st.local.u32 [%rd2+692], %r16066; | |
setp.le.u32 %p175, %r1359, %r16066; | |
mov.u32 %r16065, %r1359; | |
@%p175 bra BB12_346; | |
st.local.v2.u32 [%rd2+688], {%r16066, %r1359}; | |
mov.u32 %r14385, %r16066; | |
mov.u32 %r16066, %r1359; | |
mov.u32 %r16065, %r14385; | |
BB12_346: | |
mov.u32 %r16061, %r16065; | |
mov.u32 %r16062, %r16066; | |
bfe.u32 %r6549, %r1358, 22, 6; | |
mul.lo.s64 %rd1675, %rd103, 1792; | |
add.s64 %rd1676, %rd415, %rd1675; | |
mul.wide.u32 %rd1677, %r6549, 28; | |
add.s64 %rd1678, %rd1676, %rd1677; | |
ld.global.u32 %r6550, [%rd1678]; | |
and.b32 %r6551, %r6550, 65535; | |
bfe.u32 %r6552, %r6550, 16, 6; | |
mul.wide.u32 %rd1679, %r6551, 1792; | |
add.s64 %rd1680, %rd414, %rd1679; | |
mul.wide.u32 %rd1681, %r6552, 28; | |
add.s64 %rd1682, %rd1680, %rd1681; | |
ld.global.u32 %r6553, [%rd1682]; | |
and.b32 %r6554, %r6553, 65535; | |
shl.b32 %r6555, %r6554, 6; | |
bfe.u32 %r6556, %r6553, 16, 6; | |
or.b32 %r1363, %r6555, %r6556; | |
st.local.u32 [%rd2+696], %r1363; | |
bfe.u32 %r6557, %r6550, 22, 6; | |
mul.wide.u32 %rd1683, %r6557, 28; | |
add.s64 %rd1684, %rd1680, %rd1683; | |
ld.global.u32 %r6558, [%rd1684]; | |
and.b32 %r6559, %r6558, 65535; | |
shl.b32 %r6560, %r6559, 6; | |
bfe.u32 %r6561, %r6558, 16, 6; | |
or.b32 %r16068, %r6560, %r6561; | |
st.local.u32 [%rd2+700], %r16068; | |
setp.le.u32 %p176, %r1363, %r16068; | |
mov.u32 %r16067, %r1363; | |
@%p176 bra BB12_348; | |
st.local.v2.u32 [%rd2+696], {%r16068, %r1363}; | |
mov.u32 %r14391, %r16068; | |
mov.u32 %r16068, %r1363; | |
mov.u32 %r16067, %r14391; | |
BB12_348: | |
mov.u32 %r1366, %r16067; | |
mov.u32 %r1365, %r16068; | |
setp.le.u32 %p177, %r16061, %r1366; | |
mov.u32 %r16063, %r1366; | |
mov.u32 %r16064, %r1365; | |
@%p177 bra BB12_350; | |
st.local.v4.u32 [%rd2+688], {%r1366, %r1365, %r16061, %r16062}; | |
mov.u32 %r14388, %r16062; | |
mov.u32 %r14390, %r16061; | |
mov.u32 %r16062, %r1365; | |
mov.u32 %r16061, %r1366; | |
mov.u32 %r16063, %r14390; | |
mov.u32 %r16064, %r14388; | |
BB12_350: | |
mov.u32 %r1370, %r16061; | |
mov.u32 %r1369, %r16062; | |
mov.u32 %r1368, %r16063; | |
mov.u32 %r1367, %r16064; | |
setp.le.u32 %p178, %r16045, %r1370; | |
mov.u32 %r16049, %r1370; | |
mov.u32 %r16050, %r1369; | |
mov.u32 %r16051, %r1368; | |
mov.u32 %r16052, %r1367; | |
@%p178 bra BB12_352; | |
st.local.v4.u32 [%rd2+672], {%r1370, %r1369, %r1368, %r1367}; | |
st.local.v4.u32 [%rd2+688], {%r16045, %r16046, %r16047, %r16048}; | |
mov.u32 %r14378, %r16048; | |
mov.u32 %r14380, %r16047; | |
mov.u32 %r14382, %r16046; | |
mov.u32 %r14384, %r16045; | |
mov.u32 %r16048, %r1367; | |
mov.u32 %r16047, %r1368; | |
mov.u32 %r16046, %r1369; | |
mov.u32 %r16045, %r1370; | |
mov.u32 %r16049, %r14384; | |
mov.u32 %r16050, %r14382; | |
mov.u32 %r16051, %r14380; | |
mov.u32 %r16052, %r14378; | |
BB12_352: | |
mov.u32 %r1378, %r16045; | |
mov.u32 %r1377, %r16046; | |
mov.u32 %r1376, %r16047; | |
mov.u32 %r1375, %r16048; | |
mov.u32 %r1374, %r16049; | |
mov.u32 %r1373, %r16050; | |
mov.u32 %r1372, %r16051; | |
mov.u32 %r1371, %r16052; | |
setp.le.u32 %p179, %r16005, %r1378; | |
mov.u32 %r16013, %r1378; | |
mov.u32 %r16014, %r1377; | |
mov.u32 %r16015, %r1376; | |
mov.u32 %r16016, %r1375; | |
mov.u32 %r16017, %r1374; | |
mov.u32 %r16018, %r1373; | |
mov.u32 %r16019, %r1372; | |
mov.u32 %r16020, %r1371; | |
@%p179 bra BB12_354; | |
st.local.v4.u32 [%rd2+640], {%r1378, %r1377, %r1376, %r1375}; | |
st.local.v4.u32 [%rd2+672], {%r16005, %r16006, %r16007, %r16008}; | |
st.local.v4.u32 [%rd2+656], {%r1374, %r1373, %r1372, %r1371}; | |
st.local.v4.u32 [%rd2+688], {%r16009, %r16010, %r16011, %r16012}; | |
mov.u32 %r14350, %r16012; | |
mov.u32 %r14352, %r16011; | |
mov.u32 %r14354, %r16010; | |
mov.u32 %r14356, %r16009; | |
mov.u32 %r14358, %r16008; | |
mov.u32 %r14360, %r16007; | |
mov.u32 %r14362, %r16006; | |
mov.u32 %r14364, %r16005; | |
mov.u32 %r16012, %r1371; | |
mov.u32 %r16011, %r1372; | |
mov.u32 %r16010, %r1373; | |
mov.u32 %r16009, %r1374; | |
mov.u32 %r16008, %r1375; | |
mov.u32 %r16007, %r1376; | |
mov.u32 %r16006, %r1377; | |
mov.u32 %r16005, %r1378; | |
mov.u32 %r16013, %r14364; | |
mov.u32 %r16014, %r14362; | |
mov.u32 %r16015, %r14360; | |
mov.u32 %r16016, %r14358; | |
mov.u32 %r16017, %r14356; | |
mov.u32 %r16018, %r14354; | |
mov.u32 %r16019, %r14352; | |
mov.u32 %r16020, %r14350; | |
BB12_354: | |
mov.u32 %r15973, %r16005; | |
mov.u32 %r15974, %r16006; | |
mov.u32 %r15975, %r16007; | |
mov.u32 %r15976, %r16008; | |
mov.u32 %r15977, %r16009; | |
mov.u32 %r15978, %r16010; | |
mov.u32 %r15979, %r16011; | |
mov.u32 %r15980, %r16012; | |
mov.u32 %r15981, %r16013; | |
mov.u32 %r15982, %r16014; | |
mov.u32 %r15983, %r16015; | |
mov.u32 %r15984, %r16016; | |
mov.u32 %r15985, %r16017; | |
mov.u32 %r15986, %r16018; | |
mov.u32 %r15987, %r16019; | |
mov.u32 %r15988, %r16020; | |
mul.lo.s64 %rd1685, %rd96, 1792; | |
add.s64 %rd1686, %rd4, %rd1685; | |
bfe.u32 %r6562, %r1307, 22, 6; | |
mul.wide.u32 %rd1687, %r6562, 28; | |
add.s64 %rd1688, %rd1686, %rd1687; | |
ld.global.u32 %r1395, [%rd1688+-8]; | |
and.b32 %r6563, %r1395, 65535; | |
mul.wide.u32 %rd1689, %r6563, 1792; | |
add.s64 %rd1690, %rd6, %rd1689; | |
bfe.u32 %r6564, %r1395, 16, 6; | |
mul.wide.u32 %rd1691, %r6564, 28; | |
add.s64 %rd1692, %rd1690, %rd1691; | |
ld.global.u32 %r1396, [%rd1692+-8]; | |
and.b32 %r6565, %r1396, 65535; | |
mul.wide.u32 %rd1693, %r6565, 1792; | |
add.s64 %rd1694, %rd4, %rd1693; | |
cvt.u64.u32 %rd104, %r6563; | |
cvt.u64.u32 %rd105, %r6565; | |
bfe.u32 %r6566, %r1396, 16, 6; | |
mul.wide.u32 %rd1695, %r6566, 28; | |
add.s64 %rd1696, %rd1694, %rd1695; | |
ld.global.u32 %r1397, [%rd1696+-12]; | |
and.b32 %r6567, %r1397, 65535; | |
cvt.u64.u32 %rd106, %r6567; | |
bfe.u32 %r6568, %r1397, 16, 6; | |
mul.wide.u32 %rd1697, %r6567, 1792; | |
add.s64 %rd1698, %rd415, %rd1697; | |
mul.wide.u32 %rd1699, %r6568, 28; | |
add.s64 %rd1700, %rd1698, %rd1699; | |
ld.global.u32 %r6569, [%rd1700]; | |
and.b32 %r6570, %r6569, 65535; | |
bfe.u32 %r6571, %r6569, 16, 6; | |
mul.wide.u32 %rd1701, %r6570, 1792; | |
add.s64 %rd1702, %rd414, %rd1701; | |
mul.wide.u32 %rd1703, %r6571, 28; | |
add.s64 %rd1704, %rd1702, %rd1703; | |
ld.global.u32 %r6572, [%rd1704]; | |
and.b32 %r6573, %r6572, 65535; | |
shl.b32 %r6574, %r6573, 6; | |
bfe.u32 %r6575, %r6572, 16, 6; | |
or.b32 %r1398, %r6574, %r6575; | |
st.local.u32 [%rd2+704], %r1398; | |
bfe.u32 %r6576, %r6569, 22, 6; | |
mul.wide.u32 %rd1705, %r6576, 28; | |
add.s64 %rd1706, %rd1702, %rd1705; | |
ld.global.u32 %r6577, [%rd1706]; | |
and.b32 %r6578, %r6577, 65535; | |
shl.b32 %r6579, %r6578, 6; | |
bfe.u32 %r6580, %r6577, 16, 6; | |
or.b32 %r16098, %r6579, %r6580; | |
st.local.u32 [%rd2+708], %r16098; | |
setp.le.u32 %p180, %r1398, %r16098; | |
mov.u32 %r16097, %r1398; | |
@%p180 bra BB12_356; | |
st.local.v2.u32 [%rd2+704], {%r16098, %r1398}; | |
mov.u32 %r14453, %r16098; | |
mov.u32 %r16098, %r1398; | |
mov.u32 %r16097, %r14453; | |
BB12_356: | |
mov.u32 %r16093, %r16097; | |
mov.u32 %r16094, %r16098; | |
bfe.u32 %r6581, %r1397, 22, 6; | |
mul.lo.s64 %rd1707, %rd106, 1792; | |
add.s64 %rd1708, %rd415, %rd1707; | |
mul.wide.u32 %rd1709, %r6581, 28; | |
add.s64 %rd1710, %rd1708, %rd1709; | |
ld.global.u32 %r6582, [%rd1710]; | |
and.b32 %r6583, %r6582, 65535; | |
bfe.u32 %r6584, %r6582, 16, 6; | |
mul.wide.u32 %rd1711, %r6583, 1792; | |
add.s64 %rd1712, %rd414, %rd1711; | |
mul.wide.u32 %rd1713, %r6584, 28; | |
add.s64 %rd1714, %rd1712, %rd1713; | |
ld.global.u32 %r6585, [%rd1714]; | |
and.b32 %r6586, %r6585, 65535; | |
shl.b32 %r6587, %r6586, 6; | |
bfe.u32 %r6588, %r6585, 16, 6; | |
or.b32 %r1402, %r6587, %r6588; | |
st.local.u32 [%rd2+712], %r1402; | |
bfe.u32 %r6589, %r6582, 22, 6; | |
mul.wide.u32 %rd1715, %r6589, 28; | |
add.s64 %rd1716, %rd1712, %rd1715; | |
ld.global.u32 %r6590, [%rd1716]; | |
and.b32 %r6591, %r6590, 65535; | |
shl.b32 %r6592, %r6591, 6; | |
bfe.u32 %r6593, %r6590, 16, 6; | |
or.b32 %r16100, %r6592, %r6593; | |
st.local.u32 [%rd2+716], %r16100; | |
setp.le.u32 %p181, %r1402, %r16100; | |
mov.u32 %r16099, %r1402; | |
@%p181 bra BB12_358; | |
st.local.v2.u32 [%rd2+712], {%r16100, %r1402}; | |
mov.u32 %r14459, %r16100; | |
mov.u32 %r16100, %r1402; | |
mov.u32 %r16099, %r14459; | |
BB12_358: | |
mov.u32 %r1405, %r16099; | |
mov.u32 %r1404, %r16100; | |
setp.le.u32 %p182, %r16093, %r1405; | |
mov.u32 %r16095, %r1405; | |
mov.u32 %r16096, %r1404; | |
@%p182 bra BB12_360; | |
st.local.v4.u32 [%rd2+704], {%r1405, %r1404, %r16093, %r16094}; | |
mov.u32 %r14456, %r16094; | |
mov.u32 %r14458, %r16093; | |
mov.u32 %r16094, %r1404; | |
mov.u32 %r16093, %r1405; | |
mov.u32 %r16095, %r14458; | |
mov.u32 %r16096, %r14456; | |
BB12_360: | |
mov.u32 %r16085, %r16093; | |
mov.u32 %r16086, %r16094; | |
mov.u32 %r16087, %r16095; | |
mov.u32 %r16088, %r16096; | |
mul.lo.s64 %rd1717, %rd105, 1792; | |
add.s64 %rd1718, %rd4, %rd1717; | |
bfe.u32 %r6594, %r1396, 22, 6; | |
mul.wide.u32 %rd1719, %r6594, 28; | |
add.s64 %rd1720, %rd1718, %rd1719; | |
ld.global.u32 %r1410, [%rd1720+-12]; | |
and.b32 %r6595, %r1410, 65535; | |
cvt.u64.u32 %rd107, %r6595; | |
bfe.u32 %r6596, %r1410, 16, 6; | |
mul.wide.u32 %rd1721, %r6595, 1792; | |
add.s64 %rd1722, %rd415, %rd1721; | |
mul.wide.u32 %rd1723, %r6596, 28; | |
add.s64 %rd1724, %rd1722, %rd1723; | |
ld.global.u32 %r6597, [%rd1724]; | |
and.b32 %r6598, %r6597, 65535; | |
bfe.u32 %r6599, %r6597, 16, 6; | |
mul.wide.u32 %rd1725, %r6598, 1792; | |
add.s64 %rd1726, %rd414, %rd1725; | |
mul.wide.u32 %rd1727, %r6599, 28; | |
add.s64 %rd1728, %rd1726, %rd1727; | |
ld.global.u32 %r6600, [%rd1728]; | |
and.b32 %r6601, %r6600, 65535; | |
shl.b32 %r6602, %r6601, 6; | |
bfe.u32 %r6603, %r6600, 16, 6; | |
or.b32 %r1411, %r6602, %r6603; | |
st.local.u32 [%rd2+720], %r1411; | |
bfe.u32 %r6604, %r6597, 22, 6; | |
mul.wide.u32 %rd1729, %r6604, 28; | |
add.s64 %rd1730, %rd1726, %rd1729; | |
ld.global.u32 %r6605, [%rd1730]; | |
and.b32 %r6606, %r6605, 65535; | |
shl.b32 %r6607, %r6606, 6; | |
bfe.u32 %r6608, %r6605, 16, 6; | |
or.b32 %r16106, %r6607, %r6608; | |
st.local.u32 [%rd2+724], %r16106; | |
setp.le.u32 %p183, %r1411, %r16106; | |
mov.u32 %r16105, %r1411; | |
@%p183 bra BB12_362; | |
st.local.v2.u32 [%rd2+720], {%r16106, %r1411}; | |
mov.u32 %r14473, %r16106; | |
mov.u32 %r16106, %r1411; | |
mov.u32 %r16105, %r14473; | |
BB12_362: | |
mov.u32 %r16101, %r16105; | |
mov.u32 %r16102, %r16106; | |
bfe.u32 %r6609, %r1410, 22, 6; | |
mul.lo.s64 %rd1731, %rd107, 1792; | |
add.s64 %rd1732, %rd415, %rd1731; | |
mul.wide.u32 %rd1733, %r6609, 28; | |
add.s64 %rd1734, %rd1732, %rd1733; | |
ld.global.u32 %r6610, [%rd1734]; | |
and.b32 %r6611, %r6610, 65535; | |
bfe.u32 %r6612, %r6610, 16, 6; | |
mul.wide.u32 %rd1735, %r6611, 1792; | |
add.s64 %rd1736, %rd414, %rd1735; | |
mul.wide.u32 %rd1737, %r6612, 28; | |
add.s64 %rd1738, %rd1736, %rd1737; | |
ld.global.u32 %r6613, [%rd1738]; | |
and.b32 %r6614, %r6613, 65535; | |
shl.b32 %r6615, %r6614, 6; | |
bfe.u32 %r6616, %r6613, 16, 6; | |
or.b32 %r1415, %r6615, %r6616; | |
st.local.u32 [%rd2+728], %r1415; | |
bfe.u32 %r6617, %r6610, 22, 6; | |
mul.wide.u32 %rd1739, %r6617, 28; | |
add.s64 %rd1740, %rd1736, %rd1739; | |
ld.global.u32 %r6618, [%rd1740]; | |
and.b32 %r6619, %r6618, 65535; | |
shl.b32 %r6620, %r6619, 6; | |
bfe.u32 %r6621, %r6618, 16, 6; | |
or.b32 %r16108, %r6620, %r6621; | |
st.local.u32 [%rd2+732], %r16108; | |
setp.le.u32 %p184, %r1415, %r16108; | |
mov.u32 %r16107, %r1415; | |
@%p184 bra BB12_364; | |
st.local.v2.u32 [%rd2+728], {%r16108, %r1415}; | |
mov.u32 %r14479, %r16108; | |
mov.u32 %r16108, %r1415; | |
mov.u32 %r16107, %r14479; | |
BB12_364: | |
mov.u32 %r1418, %r16107; | |
mov.u32 %r1417, %r16108; | |
setp.le.u32 %p185, %r16101, %r1418; | |
mov.u32 %r16103, %r1418; | |
mov.u32 %r16104, %r1417; | |
@%p185 bra BB12_366; | |
st.local.v4.u32 [%rd2+720], {%r1418, %r1417, %r16101, %r16102}; | |
mov.u32 %r14476, %r16102; | |
mov.u32 %r14478, %r16101; | |
mov.u32 %r16102, %r1417; | |
mov.u32 %r16101, %r1418; | |
mov.u32 %r16103, %r14478; | |
mov.u32 %r16104, %r14476; | |
BB12_366: | |
mov.u32 %r1422, %r16101; | |
mov.u32 %r1421, %r16102; | |
mov.u32 %r1420, %r16103; | |
mov.u32 %r1419, %r16104; | |
setp.le.u32 %p186, %r16085, %r1422; | |
mov.u32 %r16089, %r1422; | |
mov.u32 %r16090, %r1421; | |
mov.u32 %r16091, %r1420; | |
mov.u32 %r16092, %r1419; | |
@%p186 bra BB12_368; | |
st.local.v4.u32 [%rd2+704], {%r1422, %r1421, %r1420, %r1419}; | |
st.local.v4.u32 [%rd2+720], {%r16085, %r16086, %r16087, %r16088}; | |
mov.u32 %r14466, %r16088; | |
mov.u32 %r14468, %r16087; | |
mov.u32 %r14470, %r16086; | |
mov.u32 %r14472, %r16085; | |
mov.u32 %r16088, %r1419; | |
mov.u32 %r16087, %r1420; | |
mov.u32 %r16086, %r1421; | |
mov.u32 %r16085, %r1422; | |
mov.u32 %r16089, %r14472; | |
mov.u32 %r16090, %r14470; | |
mov.u32 %r16091, %r14468; | |
mov.u32 %r16092, %r14466; | |
BB12_368: | |
mov.u32 %r16069, %r16085; | |
mov.u32 %r16070, %r16086; | |
mov.u32 %r16071, %r16087; | |
mov.u32 %r16072, %r16088; | |
mov.u32 %r16073, %r16089; | |
mov.u32 %r16074, %r16090; | |
mov.u32 %r16075, %r16091; | |
mov.u32 %r16076, %r16092; | |
mul.lo.s64 %rd1741, %rd104, 1792; | |
add.s64 %rd1742, %rd6, %rd1741; | |
bfe.u32 %r6622, %r1395, 22, 6; | |
mul.wide.u32 %rd1743, %r6622, 28; | |
add.s64 %rd1744, %rd1742, %rd1743; | |
ld.global.u32 %r1431, [%rd1744+-8]; | |
and.b32 %r6623, %r1431, 65535; | |
mul.wide.u32 %rd1745, %r6623, 1792; | |
add.s64 %rd1746, %rd4, %rd1745; | |
cvt.u64.u32 %rd108, %r6623; | |
bfe.u32 %r6624, %r1431, 16, 6; | |
mul.wide.u32 %rd1747, %r6624, 28; | |
add.s64 %rd1748, %rd1746, %rd1747; | |
ld.global.u32 %r1432, [%rd1748+-12]; | |
and.b32 %r6625, %r1432, 65535; | |
cvt.u64.u32 %rd109, %r6625; | |
bfe.u32 %r6626, %r1432, 16, 6; | |
mul.wide.u32 %rd1749, %r6625, 1792; | |
add.s64 %rd1750, %rd415, %rd1749; | |
mul.wide.u32 %rd1751, %r6626, 28; | |
add.s64 %rd1752, %rd1750, %rd1751; | |
ld.global.u32 %r6627, [%rd1752]; | |
and.b32 %r6628, %r6627, 65535; | |
bfe.u32 %r6629, %r6627, 16, 6; | |
mul.wide.u32 %rd1753, %r6628, 1792; | |
add.s64 %rd1754, %rd414, %rd1753; | |
mul.wide.u32 %rd1755, %r6629, 28; | |
add.s64 %rd1756, %rd1754, %rd1755; | |
ld.global.u32 %r6630, [%rd1756]; | |
and.b32 %r6631, %r6630, 65535; | |
shl.b32 %r6632, %r6631, 6; | |
bfe.u32 %r6633, %r6630, 16, 6; | |
or.b32 %r1433, %r6632, %r6633; | |
st.local.u32 [%rd2+736], %r1433; | |
bfe.u32 %r6634, %r6627, 22, 6; | |
mul.wide.u32 %rd1757, %r6634, 28; | |
add.s64 %rd1758, %rd1754, %rd1757; | |
ld.global.u32 %r6635, [%rd1758]; | |
and.b32 %r6636, %r6635, 65535; | |
shl.b32 %r6637, %r6636, 6; | |
bfe.u32 %r6638, %r6635, 16, 6; | |
or.b32 %r16122, %r6637, %r6638; | |
st.local.u32 [%rd2+740], %r16122; | |
setp.le.u32 %p187, %r1433, %r16122; | |
mov.u32 %r16121, %r1433; | |
@%p187 bra BB12_370; | |
st.local.v2.u32 [%rd2+736], {%r16122, %r1433}; | |
mov.u32 %r14509, %r16122; | |
mov.u32 %r16122, %r1433; | |
mov.u32 %r16121, %r14509; | |
BB12_370: | |
mov.u32 %r16117, %r16121; | |
mov.u32 %r16118, %r16122; | |
bfe.u32 %r6639, %r1432, 22, 6; | |
mul.lo.s64 %rd1759, %rd109, 1792; | |
add.s64 %rd1760, %rd415, %rd1759; | |
mul.wide.u32 %rd1761, %r6639, 28; | |
add.s64 %rd1762, %rd1760, %rd1761; | |
ld.global.u32 %r6640, [%rd1762]; | |
and.b32 %r6641, %r6640, 65535; | |
bfe.u32 %r6642, %r6640, 16, 6; | |
mul.wide.u32 %rd1763, %r6641, 1792; | |
add.s64 %rd1764, %rd414, %rd1763; | |
mul.wide.u32 %rd1765, %r6642, 28; | |
add.s64 %rd1766, %rd1764, %rd1765; | |
ld.global.u32 %r6643, [%rd1766]; | |
and.b32 %r6644, %r6643, 65535; | |
shl.b32 %r6645, %r6644, 6; | |
bfe.u32 %r6646, %r6643, 16, 6; | |
or.b32 %r1437, %r6645, %r6646; | |
st.local.u32 [%rd2+744], %r1437; | |
bfe.u32 %r6647, %r6640, 22, 6; | |
mul.wide.u32 %rd1767, %r6647, 28; | |
add.s64 %rd1768, %rd1764, %rd1767; | |
ld.global.u32 %r6648, [%rd1768]; | |
and.b32 %r6649, %r6648, 65535; | |
shl.b32 %r6650, %r6649, 6; | |
bfe.u32 %r6651, %r6648, 16, 6; | |
or.b32 %r16124, %r6650, %r6651; | |
st.local.u32 [%rd2+748], %r16124; | |
setp.le.u32 %p188, %r1437, %r16124; | |
mov.u32 %r16123, %r1437; | |
@%p188 bra BB12_372; | |
st.local.v2.u32 [%rd2+744], {%r16124, %r1437}; | |
mov.u32 %r14515, %r16124; | |
mov.u32 %r16124, %r1437; | |
mov.u32 %r16123, %r14515; | |
BB12_372: | |
mov.u32 %r1440, %r16123; | |
mov.u32 %r1439, %r16124; | |
setp.le.u32 %p189, %r16117, %r1440; | |
mov.u32 %r16119, %r1440; | |
mov.u32 %r16120, %r1439; | |
@%p189 bra BB12_374; | |
st.local.v4.u32 [%rd2+736], {%r1440, %r1439, %r16117, %r16118}; | |
mov.u32 %r14512, %r16118; | |
mov.u32 %r14514, %r16117; | |
mov.u32 %r16118, %r1439; | |
mov.u32 %r16117, %r1440; | |
mov.u32 %r16119, %r14514; | |
mov.u32 %r16120, %r14512; | |
BB12_374: | |
mov.u32 %r16109, %r16117; | |
mov.u32 %r16110, %r16118; | |
mov.u32 %r16111, %r16119; | |
mov.u32 %r16112, %r16120; | |
mul.lo.s64 %rd1769, %rd108, 1792; | |
add.s64 %rd1770, %rd4, %rd1769; | |
bfe.u32 %r6652, %r1431, 22, 6; | |
mul.wide.u32 %rd1771, %r6652, 28; | |
add.s64 %rd1772, %rd1770, %rd1771; | |
ld.global.u32 %r1445, [%rd1772+-12]; | |
and.b32 %r6653, %r1445, 65535; | |
cvt.u64.u32 %rd110, %r6653; | |
bfe.u32 %r6654, %r1445, 16, 6; | |
mul.wide.u32 %rd1773, %r6653, 1792; | |
add.s64 %rd1774, %rd415, %rd1773; | |
mul.wide.u32 %rd1775, %r6654, 28; | |
add.s64 %rd1776, %rd1774, %rd1775; | |
ld.global.u32 %r6655, [%rd1776]; | |
and.b32 %r6656, %r6655, 65535; | |
bfe.u32 %r6657, %r6655, 16, 6; | |
mul.wide.u32 %rd1777, %r6656, 1792; | |
add.s64 %rd1778, %rd414, %rd1777; | |
mul.wide.u32 %rd1779, %r6657, 28; | |
add.s64 %rd1780, %rd1778, %rd1779; | |
ld.global.u32 %r6658, [%rd1780]; | |
and.b32 %r6659, %r6658, 65535; | |
shl.b32 %r6660, %r6659, 6; | |
bfe.u32 %r6661, %r6658, 16, 6; | |
or.b32 %r1446, %r6660, %r6661; | |
st.local.u32 [%rd2+752], %r1446; | |
bfe.u32 %r6662, %r6655, 22, 6; | |
mul.wide.u32 %rd1781, %r6662, 28; | |
add.s64 %rd1782, %rd1778, %rd1781; | |
ld.global.u32 %r6663, [%rd1782]; | |
and.b32 %r6664, %r6663, 65535; | |
shl.b32 %r6665, %r6664, 6; | |
bfe.u32 %r6666, %r6663, 16, 6; | |
or.b32 %r16130, %r6665, %r6666; | |
st.local.u32 [%rd2+756], %r16130; | |
setp.le.u32 %p190, %r1446, %r16130; | |
mov.u32 %r16129, %r1446; | |
@%p190 bra BB12_376; | |
st.local.v2.u32 [%rd2+752], {%r16130, %r1446}; | |
mov.u32 %r14529, %r16130; | |
mov.u32 %r16130, %r1446; | |
mov.u32 %r16129, %r14529; | |
BB12_376: | |
mov.u32 %r16125, %r16129; | |
mov.u32 %r16126, %r16130; | |
bfe.u32 %r6667, %r1445, 22, 6; | |
mul.lo.s64 %rd1783, %rd110, 1792; | |
add.s64 %rd1784, %rd415, %rd1783; | |
mul.wide.u32 %rd1785, %r6667, 28; | |
add.s64 %rd1786, %rd1784, %rd1785; | |
ld.global.u32 %r6668, [%rd1786]; | |
and.b32 %r6669, %r6668, 65535; | |
bfe.u32 %r6670, %r6668, 16, 6; | |
mul.wide.u32 %rd1787, %r6669, 1792; | |
add.s64 %rd1788, %rd414, %rd1787; | |
mul.wide.u32 %rd1789, %r6670, 28; | |
add.s64 %rd1790, %rd1788, %rd1789; | |
ld.global.u32 %r6671, [%rd1790]; | |
and.b32 %r6672, %r6671, 65535; | |
shl.b32 %r6673, %r6672, 6; | |
bfe.u32 %r6674, %r6671, 16, 6; | |
or.b32 %r1450, %r6673, %r6674; | |
st.local.u32 [%rd2+760], %r1450; | |
bfe.u32 %r6675, %r6668, 22, 6; | |
mul.wide.u32 %rd1791, %r6675, 28; | |
add.s64 %rd1792, %rd1788, %rd1791; | |
ld.global.u32 %r6676, [%rd1792]; | |
and.b32 %r6677, %r6676, 65535; | |
shl.b32 %r6678, %r6677, 6; | |
bfe.u32 %r6679, %r6676, 16, 6; | |
or.b32 %r16132, %r6678, %r6679; | |
st.local.u32 [%rd2+764], %r16132; | |
setp.le.u32 %p191, %r1450, %r16132; | |
mov.u32 %r16131, %r1450; | |
@%p191 bra BB12_378; | |
st.local.v2.u32 [%rd2+760], {%r16132, %r1450}; | |
mov.u32 %r14535, %r16132; | |
mov.u32 %r16132, %r1450; | |
mov.u32 %r16131, %r14535; | |
BB12_378: | |
mov.u32 %r1453, %r16131; | |
mov.u32 %r1452, %r16132; | |
setp.le.u32 %p192, %r16125, %r1453; | |
mov.u32 %r16127, %r1453; | |
mov.u32 %r16128, %r1452; | |
@%p192 bra BB12_380; | |
st.local.v4.u32 [%rd2+752], {%r1453, %r1452, %r16125, %r16126}; | |
mov.u32 %r14532, %r16126; | |
mov.u32 %r14534, %r16125; | |
mov.u32 %r16126, %r1452; | |
mov.u32 %r16125, %r1453; | |
mov.u32 %r16127, %r14534; | |
mov.u32 %r16128, %r14532; | |
BB12_380: | |
mov.u32 %r1457, %r16125; | |
mov.u32 %r1456, %r16126; | |
mov.u32 %r1455, %r16127; | |
mov.u32 %r1454, %r16128; | |
setp.le.u32 %p193, %r16109, %r1457; | |
mov.u32 %r16113, %r1457; | |
mov.u32 %r16114, %r1456; | |
mov.u32 %r16115, %r1455; | |
mov.u32 %r16116, %r1454; | |
@%p193 bra BB12_382; | |
st.local.v4.u32 [%rd2+736], {%r1457, %r1456, %r1455, %r1454}; | |
st.local.v4.u32 [%rd2+752], {%r16109, %r16110, %r16111, %r16112}; | |
mov.u32 %r14522, %r16112; | |
mov.u32 %r14524, %r16111; | |
mov.u32 %r14526, %r16110; | |
mov.u32 %r14528, %r16109; | |
mov.u32 %r16112, %r1454; | |
mov.u32 %r16111, %r1455; | |
mov.u32 %r16110, %r1456; | |
mov.u32 %r16109, %r1457; | |
mov.u32 %r16113, %r14528; | |
mov.u32 %r16114, %r14526; | |
mov.u32 %r16115, %r14524; | |
mov.u32 %r16116, %r14522; | |
BB12_382: | |
mov.u32 %r1465, %r16109; | |
mov.u32 %r1464, %r16110; | |
mov.u32 %r1463, %r16111; | |
mov.u32 %r1462, %r16112; | |
mov.u32 %r1461, %r16113; | |
mov.u32 %r1460, %r16114; | |
mov.u32 %r1459, %r16115; | |
mov.u32 %r1458, %r16116; | |
setp.le.u32 %p194, %r16069, %r1465; | |
mov.u32 %r16077, %r1465; | |
mov.u32 %r16078, %r1464; | |
mov.u32 %r16079, %r1463; | |
mov.u32 %r16080, %r1462; | |
mov.u32 %r16081, %r1461; | |
mov.u32 %r16082, %r1460; | |
mov.u32 %r16083, %r1459; | |
mov.u32 %r16084, %r1458; | |
@%p194 bra BB12_384; | |
st.local.v4.u32 [%rd2+704], {%r1465, %r1464, %r1463, %r1462}; | |
st.local.v4.u32 [%rd2+736], {%r16069, %r16070, %r16071, %r16072}; | |
st.local.v4.u32 [%rd2+720], {%r1461, %r1460, %r1459, %r1458}; | |
st.local.v4.u32 [%rd2+752], {%r16073, %r16074, %r16075, %r16076}; | |
mov.u32 %r14494, %r16076; | |
mov.u32 %r14496, %r16075; | |
mov.u32 %r14498, %r16074; | |
mov.u32 %r14500, %r16073; | |
mov.u32 %r14502, %r16072; | |
mov.u32 %r14504, %r16071; | |
mov.u32 %r14506, %r16070; | |
mov.u32 %r14508, %r16069; | |
mov.u32 %r16076, %r1458; | |
mov.u32 %r16075, %r1459; | |
mov.u32 %r16074, %r1460; | |
mov.u32 %r16073, %r1461; | |
mov.u32 %r16072, %r1462; | |
mov.u32 %r16071, %r1463; | |
mov.u32 %r16070, %r1464; | |
mov.u32 %r16069, %r1465; | |
mov.u32 %r16077, %r14508; | |
mov.u32 %r16078, %r14506; | |
mov.u32 %r16079, %r14504; | |
mov.u32 %r16080, %r14502; | |
mov.u32 %r16081, %r14500; | |
mov.u32 %r16082, %r14498; | |
mov.u32 %r16083, %r14496; | |
mov.u32 %r16084, %r14494; | |
BB12_384: | |
mov.u32 %r1481, %r16069; | |
mov.u32 %r1480, %r16070; | |
mov.u32 %r1479, %r16071; | |
mov.u32 %r1478, %r16072; | |
mov.u32 %r1477, %r16073; | |
mov.u32 %r1476, %r16074; | |
mov.u32 %r1475, %r16075; | |
mov.u32 %r1474, %r16076; | |
mov.u32 %r1473, %r16077; | |
mov.u32 %r1472, %r16078; | |
mov.u32 %r1471, %r16079; | |
mov.u32 %r1470, %r16080; | |
mov.u32 %r1469, %r16081; | |
mov.u32 %r1468, %r16082; | |
mov.u32 %r1467, %r16083; | |
mov.u32 %r1466, %r16084; | |
setp.le.u32 %p195, %r15973, %r1481; | |
mov.u32 %r15989, %r1481; | |
mov.u32 %r15990, %r1480; | |
mov.u32 %r15991, %r1479; | |
mov.u32 %r15992, %r1478; | |
mov.u32 %r15993, %r1477; | |
mov.u32 %r15994, %r1476; | |
mov.u32 %r15995, %r1475; | |
mov.u32 %r15996, %r1474; | |
mov.u32 %r15997, %r1473; | |
mov.u32 %r15998, %r1472; | |
mov.u32 %r15999, %r1471; | |
mov.u32 %r16000, %r1470; | |
mov.u32 %r16001, %r1469; | |
mov.u32 %r16002, %r1468; | |
mov.u32 %r16003, %r1467; | |
mov.u32 %r16004, %r1466; | |
@%p195 bra BB12_386; | |
st.local.v4.u32 [%rd2+640], {%r1481, %r1480, %r1479, %r1478}; | |
st.local.v4.u32 [%rd2+704], {%r15973, %r15974, %r15975, %r15976}; | |
st.local.v4.u32 [%rd2+656], {%r1477, %r1476, %r1475, %r1474}; | |
st.local.v4.u32 [%rd2+720], {%r15977, %r15978, %r15979, %r15980}; | |
st.local.v4.u32 [%rd2+672], {%r1473, %r1472, %r1471, %r1470}; | |
st.local.v4.u32 [%rd2+736], {%r15981, %r15982, %r15983, %r15984}; | |
st.local.v4.u32 [%rd2+688], {%r1469, %r1468, %r1467, %r1466}; | |
st.local.v4.u32 [%rd2+752], {%r15985, %r15986, %r15987, %r15988}; | |
mov.u32 %r14422, %r15988; | |
mov.u32 %r14424, %r15987; | |
mov.u32 %r14426, %r15986; | |
mov.u32 %r14428, %r15985; | |
mov.u32 %r14430, %r15984; | |
mov.u32 %r14432, %r15983; | |
mov.u32 %r14434, %r15982; | |
mov.u32 %r14436, %r15981; | |
mov.u32 %r14438, %r15980; | |
mov.u32 %r14440, %r15979; | |
mov.u32 %r14442, %r15978; | |
mov.u32 %r14444, %r15977; | |
mov.u32 %r14446, %r15976; | |
mov.u32 %r14448, %r15975; | |
mov.u32 %r14450, %r15974; | |
mov.u32 %r14452, %r15973; | |
mov.u32 %r15988, %r1466; | |
mov.u32 %r15987, %r1467; | |
mov.u32 %r15986, %r1468; | |
mov.u32 %r15985, %r1469; | |
mov.u32 %r15984, %r1470; | |
mov.u32 %r15983, %r1471; | |
mov.u32 %r15982, %r1472; | |
mov.u32 %r15981, %r1473; | |
mov.u32 %r15980, %r1474; | |
mov.u32 %r15979, %r1475; | |
mov.u32 %r15978, %r1476; | |
mov.u32 %r15977, %r1477; | |
mov.u32 %r15976, %r1478; | |
mov.u32 %r15975, %r1479; | |
mov.u32 %r15974, %r1480; | |
mov.u32 %r15973, %r1481; | |
mov.u32 %r15989, %r14452; | |
mov.u32 %r15990, %r14450; | |
mov.u32 %r15991, %r14448; | |
mov.u32 %r15992, %r14446; | |
mov.u32 %r15993, %r14444; | |
mov.u32 %r15994, %r14442; | |
mov.u32 %r15995, %r14440; | |
mov.u32 %r15996, %r14438; | |
mov.u32 %r15997, %r14436; | |
mov.u32 %r15998, %r14434; | |
mov.u32 %r15999, %r14432; | |
mov.u32 %r16000, %r14430; | |
mov.u32 %r16001, %r14428; | |
mov.u32 %r16002, %r14426; | |
mov.u32 %r16003, %r14424; | |
mov.u32 %r16004, %r14422; | |
BB12_386: | |
mov.u32 %r1513, %r15973; | |
mov.u32 %r1512, %r15974; | |
mov.u32 %r1511, %r15975; | |
mov.u32 %r1510, %r15976; | |
mov.u32 %r1509, %r15977; | |
mov.u32 %r1508, %r15978; | |
mov.u32 %r1507, %r15979; | |
mov.u32 %r1506, %r15980; | |
mov.u32 %r1505, %r15981; | |
mov.u32 %r1504, %r15982; | |
mov.u32 %r1503, %r15983; | |
mov.u32 %r1502, %r15984; | |
mov.u32 %r1501, %r15985; | |
mov.u32 %r1500, %r15986; | |
mov.u32 %r1499, %r15987; | |
mov.u32 %r1498, %r15988; | |
mov.u32 %r1497, %r15989; | |
mov.u32 %r1496, %r15990; | |
mov.u32 %r1495, %r15991; | |
mov.u32 %r1494, %r15992; | |
mov.u32 %r1493, %r15993; | |
mov.u32 %r1492, %r15994; | |
mov.u32 %r1491, %r15995; | |
mov.u32 %r1490, %r15996; | |
mov.u32 %r1489, %r15997; | |
mov.u32 %r1488, %r15998; | |
mov.u32 %r1487, %r15999; | |
mov.u32 %r1486, %r16000; | |
mov.u32 %r1485, %r16001; | |
mov.u32 %r1484, %r16002; | |
mov.u32 %r1483, %r16003; | |
mov.u32 %r1482, %r16004; | |
setp.le.u32 %p196, %r15749, %r1513; | |
mov.u32 %r15781, %r1513; | |
mov.u32 %r15782, %r1512; | |
mov.u32 %r15783, %r1511; | |
mov.u32 %r15784, %r1510; | |
mov.u32 %r15785, %r1509; | |
mov.u32 %r15786, %r1508; | |
mov.u32 %r15787, %r1507; | |
mov.u32 %r15788, %r1506; | |
mov.u32 %r15789, %r1505; | |
mov.u32 %r15790, %r1504; | |
mov.u32 %r15791, %r1503; | |
mov.u32 %r15792, %r1502; | |
mov.u32 %r15793, %r1501; | |
mov.u32 %r15794, %r1500; | |
mov.u32 %r15795, %r1499; | |
mov.u32 %r15796, %r1498; | |
mov.u32 %r15797, %r1497; | |
mov.u32 %r15798, %r1496; | |
mov.u32 %r15799, %r1495; | |
mov.u32 %r15800, %r1494; | |
mov.u32 %r15801, %r1493; | |
mov.u32 %r15802, %r1492; | |
mov.u32 %r15803, %r1491; | |
mov.u32 %r15804, %r1490; | |
mov.u32 %r15805, %r1489; | |
mov.u32 %r15806, %r1488; | |
mov.u32 %r15807, %r1487; | |
mov.u32 %r15808, %r1486; | |
mov.u32 %r15809, %r1485; | |
mov.u32 %r15810, %r1484; | |
mov.u32 %r15811, %r1483; | |
mov.u32 %r15812, %r1482; | |
@%p196 bra BB12_388; | |
st.local.v4.u32 [%rd2+512], {%r1513, %r1512, %r1511, %r1510}; | |
st.local.v4.u32 [%rd2+640], {%r15749, %r15750, %r15751, %r15752}; | |
st.local.v4.u32 [%rd2+528], {%r1509, %r1508, %r1507, %r1506}; | |
st.local.v4.u32 [%rd2+656], {%r15753, %r15754, %r15755, %r15756}; | |
st.local.v4.u32 [%rd2+544], {%r1505, %r1504, %r1503, %r1502}; | |
st.local.v4.u32 [%rd2+672], {%r15757, %r15758, %r15759, %r15760}; | |
st.local.v4.u32 [%rd2+560], {%r1501, %r1500, %r1499, %r1498}; | |
st.local.v4.u32 [%rd2+688], {%r15761, %r15762, %r15763, %r15764}; | |
st.local.v4.u32 [%rd2+576], {%r1497, %r1496, %r1495, %r1494}; | |
st.local.v4.u32 [%rd2+704], {%r15765, %r15766, %r15767, %r15768}; | |
st.local.v4.u32 [%rd2+592], {%r1493, %r1492, %r1491, %r1490}; | |
st.local.v4.u32 [%rd2+720], {%r15769, %r15770, %r15771, %r15772}; | |
st.local.v4.u32 [%rd2+608], {%r1489, %r1488, %r1487, %r1486}; | |
st.local.v4.u32 [%rd2+736], {%r15773, %r15774, %r15775, %r15776}; | |
st.local.v4.u32 [%rd2+624], {%r1485, %r1484, %r1483, %r1482}; | |
st.local.v4.u32 [%rd2+752], {%r15777, %r15778, %r15779, %r15780}; | |
mov.u32 %r14246, %r15780; | |
mov.u32 %r14248, %r15779; | |
mov.u32 %r14250, %r15778; | |
mov.u32 %r14252, %r15777; | |
mov.u32 %r14254, %r15776; | |
mov.u32 %r14256, %r15775; | |
mov.u32 %r14258, %r15774; | |
mov.u32 %r14260, %r15773; | |
mov.u32 %r14262, %r15772; | |
mov.u32 %r14264, %r15771; | |
mov.u32 %r14266, %r15770; | |
mov.u32 %r14268, %r15769; | |
mov.u32 %r14270, %r15768; | |
mov.u32 %r14272, %r15767; | |
mov.u32 %r14274, %r15766; | |
mov.u32 %r14276, %r15765; | |
mov.u32 %r14278, %r15764; | |
mov.u32 %r14280, %r15763; | |
mov.u32 %r14282, %r15762; | |
mov.u32 %r14284, %r15761; | |
mov.u32 %r14286, %r15760; | |
mov.u32 %r14288, %r15759; | |
mov.u32 %r14290, %r15758; | |
mov.u32 %r14292, %r15757; | |
mov.u32 %r14294, %r15756; | |
mov.u32 %r14296, %r15755; | |
mov.u32 %r14298, %r15754; | |
mov.u32 %r14300, %r15753; | |
mov.u32 %r14302, %r15752; | |
mov.u32 %r14304, %r15751; | |
mov.u32 %r14306, %r15750; | |
mov.u32 %r14308, %r15749; | |
mov.u32 %r15780, %r1482; | |
mov.u32 %r15779, %r1483; | |
mov.u32 %r15778, %r1484; | |
mov.u32 %r15777, %r1485; | |
mov.u32 %r15776, %r1486; | |
mov.u32 %r15775, %r1487; | |
mov.u32 %r15774, %r1488; | |
mov.u32 %r15773, %r1489; | |
mov.u32 %r15772, %r1490; | |
mov.u32 %r15771, %r1491; | |
mov.u32 %r15770, %r1492; | |
mov.u32 %r15769, %r1493; | |
mov.u32 %r15768, %r1494; | |
mov.u32 %r15767, %r1495; | |
mov.u32 %r15766, %r1496; | |
mov.u32 %r15765, %r1497; | |
mov.u32 %r15764, %r1498; | |
mov.u32 %r15763, %r1499; | |
mov.u32 %r15762, %r1500; | |
mov.u32 %r15761, %r1501; | |
mov.u32 %r15760, %r1502; | |
mov.u32 %r15759, %r1503; | |
mov.u32 %r15758, %r1504; | |
mov.u32 %r15757, %r1505; | |
mov.u32 %r15756, %r1506; | |
mov.u32 %r15755, %r1507; | |
mov.u32 %r15754, %r1508; | |
mov.u32 %r15753, %r1509; | |
mov.u32 %r15752, %r1510; | |
mov.u32 %r15751, %r1511; | |
mov.u32 %r15750, %r1512; | |
mov.u32 %r15749, %r1513; | |
mov.u32 %r15781, %r14308; | |
mov.u32 %r15782, %r14306; | |
mov.u32 %r15783, %r14304; | |
mov.u32 %r15784, %r14302; | |
mov.u32 %r15785, %r14300; | |
mov.u32 %r15786, %r14298; | |
mov.u32 %r15787, %r14296; | |
mov.u32 %r15788, %r14294; | |
mov.u32 %r15789, %r14292; | |
mov.u32 %r15790, %r14290; | |
mov.u32 %r15791, %r14288; | |
mov.u32 %r15792, %r14286; | |
mov.u32 %r15793, %r14284; | |
mov.u32 %r15794, %r14282; | |
mov.u32 %r15795, %r14280; | |
mov.u32 %r15796, %r14278; | |
mov.u32 %r15797, %r14276; | |
mov.u32 %r15798, %r14274; | |
mov.u32 %r15799, %r14272; | |
mov.u32 %r15800, %r14270; | |
mov.u32 %r15801, %r14268; | |
mov.u32 %r15802, %r14266; | |
mov.u32 %r15803, %r14264; | |
mov.u32 %r15804, %r14262; | |
mov.u32 %r15805, %r14260; | |
mov.u32 %r15806, %r14258; | |
mov.u32 %r15807, %r14256; | |
mov.u32 %r15808, %r14254; | |
mov.u32 %r15809, %r14252; | |
mov.u32 %r15810, %r14250; | |
mov.u32 %r15811, %r14248; | |
mov.u32 %r15812, %r14246; | |
BB12_388: | |
mov.u32 %r15621, %r15749; | |
mov.u32 %r15622, %r15750; | |
mov.u32 %r15623, %r15751; | |
mov.u32 %r15624, %r15752; | |
mov.u32 %r15625, %r15753; | |
mov.u32 %r15626, %r15754; | |
mov.u32 %r15627, %r15755; | |
mov.u32 %r15628, %r15756; | |
mov.u32 %r15629, %r15757; | |
mov.u32 %r15630, %r15758; | |
mov.u32 %r15631, %r15759; | |
mov.u32 %r15632, %r15760; | |
mov.u32 %r15633, %r15761; | |
mov.u32 %r15634, %r15762; | |
mov.u32 %r15635, %r15763; | |
mov.u32 %r15636, %r15764; | |
mov.u32 %r15637, %r15765; | |
mov.u32 %r15638, %r15766; | |
mov.u32 %r15639, %r15767; | |
mov.u32 %r15640, %r15768; | |
mov.u32 %r15641, %r15769; | |
mov.u32 %r15642, %r15770; | |
mov.u32 %r15643, %r15771; | |
mov.u32 %r15644, %r15772; | |
mov.u32 %r15645, %r15773; | |
mov.u32 %r15646, %r15774; | |
mov.u32 %r15647, %r15775; | |
mov.u32 %r15648, %r15776; | |
mov.u32 %r15649, %r15777; | |
mov.u32 %r15650, %r15778; | |
mov.u32 %r15651, %r15779; | |
mov.u32 %r15652, %r15780; | |
mov.u32 %r15653, %r15781; | |
mov.u32 %r15654, %r15782; | |
mov.u32 %r15655, %r15783; | |
mov.u32 %r15656, %r15784; | |
mov.u32 %r15657, %r15785; | |
mov.u32 %r15658, %r15786; | |
mov.u32 %r15659, %r15787; | |
mov.u32 %r15660, %r15788; | |
mov.u32 %r15661, %r15789; | |
mov.u32 %r15662, %r15790; | |
mov.u32 %r15663, %r15791; | |
mov.u32 %r15664, %r15792; | |
mov.u32 %r15665, %r15793; | |
mov.u32 %r15666, %r15794; | |
mov.u32 %r15667, %r15795; | |
mov.u32 %r15668, %r15796; | |
mov.u32 %r15669, %r15797; | |
mov.u32 %r15670, %r15798; | |
mov.u32 %r15671, %r15799; | |
mov.u32 %r15672, %r15800; | |
mov.u32 %r15673, %r15801; | |
mov.u32 %r15674, %r15802; | |
mov.u32 %r15675, %r15803; | |
mov.u32 %r15676, %r15804; | |
mov.u32 %r15677, %r15805; | |
mov.u32 %r15678, %r15806; | |
mov.u32 %r15679, %r15807; | |
mov.u32 %r15680, %r15808; | |
mov.u32 %r15681, %r15809; | |
mov.u32 %r15682, %r15810; | |
mov.u32 %r15683, %r15811; | |
mov.u32 %r15684, %r15812; | |
mul.lo.s64 %rd1793, %rd79, 1792; | |
add.s64 %rd1794, %rd4, %rd1793; | |
bfe.u32 %r6680, %r1098, 22, 6; | |
mul.wide.u32 %rd1795, %r6680, 28; | |
add.s64 %rd1796, %rd1794, %rd1795; | |
ld.global.u32 %r1578, [%rd1796+-4]; | |
and.b32 %r6681, %r1578, 65535; | |
mul.wide.u32 %rd1797, %r6681, 1792; | |
add.s64 %rd1798, %rd6, %rd1797; | |
bfe.u32 %r6682, %r1578, 16, 6; | |
mul.wide.u32 %rd1799, %r6682, 28; | |
add.s64 %rd1800, %rd1798, %rd1799; | |
ld.global.u32 %r1579, [%rd1800+-4]; | |
and.b32 %r6683, %r1579, 65535; | |
mul.wide.u32 %rd1801, %r6683, 1792; | |
add.s64 %rd1802, %rd4, %rd1801; | |
bfe.u32 %r6684, %r1579, 16, 6; | |
mul.wide.u32 %rd1803, %r6684, 28; | |
add.s64 %rd1804, %rd1802, %rd1803; | |
ld.global.u32 %r1580, [%rd1804+-8]; | |
and.b32 %r6685, %r1580, 65535; | |
mul.wide.u32 %rd1805, %r6685, 1792; | |
add.s64 %rd1806, %rd6, %rd1805; | |
bfe.u32 %r6686, %r1580, 16, 6; | |
mul.wide.u32 %rd1807, %r6686, 28; | |
add.s64 %rd1808, %rd1806, %rd1807; | |
ld.global.u32 %r1581, [%rd1808+-8]; | |
and.b32 %r6687, %r1581, 65535; | |
mul.wide.u32 %rd1809, %r6687, 1792; | |
add.s64 %rd1810, %rd4, %rd1809; | |
cvt.u64.u32 %rd111, %r6681; | |
cvt.u64.u32 %rd112, %r6683; | |
cvt.u64.u32 %rd113, %r6685; | |
cvt.u64.u32 %rd114, %r6687; | |
bfe.u32 %r6688, %r1581, 16, 6; | |
mul.wide.u32 %rd1811, %r6688, 28; | |
add.s64 %rd1812, %rd1810, %rd1811; | |
ld.global.u32 %r1582, [%rd1812+-12]; | |
and.b32 %r6689, %r1582, 65535; | |
cvt.u64.u32 %rd115, %r6689; | |
bfe.u32 %r6690, %r1582, 16, 6; | |
mul.wide.u32 %rd1813, %r6689, 1792; | |
add.s64 %rd1814, %rd415, %rd1813; | |
mul.wide.u32 %rd1815, %r6690, 28; | |
add.s64 %rd1816, %rd1814, %rd1815; | |
ld.global.u32 %r6691, [%rd1816]; | |
and.b32 %r6692, %r6691, 65535; | |
bfe.u32 %r6693, %r6691, 16, 6; | |
mul.wide.u32 %rd1817, %r6692, 1792; | |
add.s64 %rd1818, %rd414, %rd1817; | |
mul.wide.u32 %rd1819, %r6693, 28; | |
add.s64 %rd1820, %rd1818, %rd1819; | |
ld.global.u32 %r6694, [%rd1820]; | |
and.b32 %r6695, %r6694, 65535; | |
shl.b32 %r6696, %r6695, 6; | |
bfe.u32 %r6697, %r6694, 16, 6; | |
or.b32 %r1583, %r6696, %r6697; | |
st.local.u32 [%rd2+768], %r1583; | |
bfe.u32 %r6698, %r6691, 22, 6; | |
mul.wide.u32 %rd1821, %r6698, 28; | |
add.s64 %rd1822, %rd1818, %rd1821; | |
ld.global.u32 %r6699, [%rd1822]; | |
and.b32 %r6700, %r6699, 65535; | |
shl.b32 %r6701, %r6700, 6; | |
bfe.u32 %r6702, %r6699, 16, 6; | |
or.b32 %r16258, %r6701, %r6702; | |
st.local.u32 [%rd2+772], %r16258; | |
setp.le.u32 %p197, %r1583, %r16258; | |
mov.u32 %r16257, %r1583; | |
@%p197 bra BB12_390; | |
st.local.v2.u32 [%rd2+768], {%r16258, %r1583}; | |
mov.u32 %r14789, %r16258; | |
mov.u32 %r16258, %r1583; | |
mov.u32 %r16257, %r14789; | |
BB12_390: | |
mov.u32 %r16253, %r16257; | |
mov.u32 %r16254, %r16258; | |
bfe.u32 %r6703, %r1582, 22, 6; | |
mul.lo.s64 %rd1823, %rd115, 1792; | |
add.s64 %rd1824, %rd415, %rd1823; | |
mul.wide.u32 %rd1825, %r6703, 28; | |
add.s64 %rd1826, %rd1824, %rd1825; | |
ld.global.u32 %r6704, [%rd1826]; | |
and.b32 %r6705, %r6704, 65535; | |
bfe.u32 %r6706, %r6704, 16, 6; | |
mul.wide.u32 %rd1827, %r6705, 1792; | |
add.s64 %rd1828, %rd414, %rd1827; | |
mul.wide.u32 %rd1829, %r6706, 28; | |
add.s64 %rd1830, %rd1828, %rd1829; | |
ld.global.u32 %r6707, [%rd1830]; | |
and.b32 %r6708, %r6707, 65535; | |
shl.b32 %r6709, %r6708, 6; | |
bfe.u32 %r6710, %r6707, 16, 6; | |
or.b32 %r1587, %r6709, %r6710; | |
st.local.u32 [%rd2+776], %r1587; | |
bfe.u32 %r6711, %r6704, 22, 6; | |
mul.wide.u32 %rd1831, %r6711, 28; | |
add.s64 %rd1832, %rd1828, %rd1831; | |
ld.global.u32 %r6712, [%rd1832]; | |
and.b32 %r6713, %r6712, 65535; | |
shl.b32 %r6714, %r6713, 6; | |
bfe.u32 %r6715, %r6712, 16, 6; | |
or.b32 %r16260, %r6714, %r6715; | |
st.local.u32 [%rd2+780], %r16260; | |
setp.le.u32 %p198, %r1587, %r16260; | |
mov.u32 %r16259, %r1587; | |
@%p198 bra BB12_392; | |
st.local.v2.u32 [%rd2+776], {%r16260, %r1587}; | |
mov.u32 %r14795, %r16260; | |
mov.u32 %r16260, %r1587; | |
mov.u32 %r16259, %r14795; | |
BB12_392: | |
mov.u32 %r1590, %r16259; | |
mov.u32 %r1589, %r16260; | |
setp.le.u32 %p199, %r16253, %r1590; | |
mov.u32 %r16255, %r1590; | |
mov.u32 %r16256, %r1589; | |
@%p199 bra BB12_394; | |
st.local.v4.u32 [%rd2+768], {%r1590, %r1589, %r16253, %r16254}; | |
mov.u32 %r14792, %r16254; | |
mov.u32 %r14794, %r16253; | |
mov.u32 %r16254, %r1589; | |
mov.u32 %r16253, %r1590; | |
mov.u32 %r16255, %r14794; | |
mov.u32 %r16256, %r14792; | |
BB12_394: | |
mov.u32 %r16245, %r16253; | |
mov.u32 %r16246, %r16254; | |
mov.u32 %r16247, %r16255; | |
mov.u32 %r16248, %r16256; | |
mul.lo.s64 %rd1833, %rd114, 1792; | |
add.s64 %rd1834, %rd4, %rd1833; | |
bfe.u32 %r6716, %r1581, 22, 6; | |
mul.wide.u32 %rd1835, %r6716, 28; | |
add.s64 %rd1836, %rd1834, %rd1835; | |
ld.global.u32 %r1595, [%rd1836+-12]; | |
and.b32 %r6717, %r1595, 65535; | |
cvt.u64.u32 %rd116, %r6717; | |
bfe.u32 %r6718, %r1595, 16, 6; | |
mul.wide.u32 %rd1837, %r6717, 1792; | |
add.s64 %rd1838, %rd415, %rd1837; | |
mul.wide.u32 %rd1839, %r6718, 28; | |
add.s64 %rd1840, %rd1838, %rd1839; | |
ld.global.u32 %r6719, [%rd1840]; | |
and.b32 %r6720, %r6719, 65535; | |
bfe.u32 %r6721, %r6719, 16, 6; | |
mul.wide.u32 %rd1841, %r6720, 1792; | |
add.s64 %rd1842, %rd414, %rd1841; | |
mul.wide.u32 %rd1843, %r6721, 28; | |
add.s64 %rd1844, %rd1842, %rd1843; | |
ld.global.u32 %r6722, [%rd1844]; | |
and.b32 %r6723, %r6722, 65535; | |
shl.b32 %r6724, %r6723, 6; | |
bfe.u32 %r6725, %r6722, 16, 6; | |
or.b32 %r1596, %r6724, %r6725; | |
st.local.u32 [%rd2+784], %r1596; | |
bfe.u32 %r6726, %r6719, 22, 6; | |
mul.wide.u32 %rd1845, %r6726, 28; | |
add.s64 %rd1846, %rd1842, %rd1845; | |
ld.global.u32 %r6727, [%rd1846]; | |
and.b32 %r6728, %r6727, 65535; | |
shl.b32 %r6729, %r6728, 6; | |
bfe.u32 %r6730, %r6727, 16, 6; | |
or.b32 %r16266, %r6729, %r6730; | |
st.local.u32 [%rd2+788], %r16266; | |
setp.le.u32 %p200, %r1596, %r16266; | |
mov.u32 %r16265, %r1596; | |
@%p200 bra BB12_396; | |
st.local.v2.u32 [%rd2+784], {%r16266, %r1596}; | |
mov.u32 %r14809, %r16266; | |
mov.u32 %r16266, %r1596; | |
mov.u32 %r16265, %r14809; | |
BB12_396: | |
mov.u32 %r16261, %r16265; | |
mov.u32 %r16262, %r16266; | |
bfe.u32 %r6731, %r1595, 22, 6; | |
mul.lo.s64 %rd1847, %rd116, 1792; | |
add.s64 %rd1848, %rd415, %rd1847; | |
mul.wide.u32 %rd1849, %r6731, 28; | |
add.s64 %rd1850, %rd1848, %rd1849; | |
ld.global.u32 %r6732, [%rd1850]; | |
and.b32 %r6733, %r6732, 65535; | |
bfe.u32 %r6734, %r6732, 16, 6; | |
mul.wide.u32 %rd1851, %r6733, 1792; | |
add.s64 %rd1852, %rd414, %rd1851; | |
mul.wide.u32 %rd1853, %r6734, 28; | |
add.s64 %rd1854, %rd1852, %rd1853; | |
ld.global.u32 %r6735, [%rd1854]; | |
and.b32 %r6736, %r6735, 65535; | |
shl.b32 %r6737, %r6736, 6; | |
bfe.u32 %r6738, %r6735, 16, 6; | |
or.b32 %r1600, %r6737, %r6738; | |
st.local.u32 [%rd2+792], %r1600; | |
bfe.u32 %r6739, %r6732, 22, 6; | |
mul.wide.u32 %rd1855, %r6739, 28; | |
add.s64 %rd1856, %rd1852, %rd1855; | |
ld.global.u32 %r6740, [%rd1856]; | |
and.b32 %r6741, %r6740, 65535; | |
shl.b32 %r6742, %r6741, 6; | |
bfe.u32 %r6743, %r6740, 16, 6; | |
or.b32 %r16268, %r6742, %r6743; | |
st.local.u32 [%rd2+796], %r16268; | |
setp.le.u32 %p201, %r1600, %r16268; | |
mov.u32 %r16267, %r1600; | |
@%p201 bra BB12_398; | |
st.local.v2.u32 [%rd2+792], {%r16268, %r1600}; | |
mov.u32 %r14815, %r16268; | |
mov.u32 %r16268, %r1600; | |
mov.u32 %r16267, %r14815; | |
BB12_398: | |
mov.u32 %r1603, %r16267; | |
mov.u32 %r1602, %r16268; | |
setp.le.u32 %p202, %r16261, %r1603; | |
mov.u32 %r16263, %r1603; | |
mov.u32 %r16264, %r1602; | |
@%p202 bra BB12_400; | |
st.local.v4.u32 [%rd2+784], {%r1603, %r1602, %r16261, %r16262}; | |
mov.u32 %r14812, %r16262; | |
mov.u32 %r14814, %r16261; | |
mov.u32 %r16262, %r1602; | |
mov.u32 %r16261, %r1603; | |
mov.u32 %r16263, %r14814; | |
mov.u32 %r16264, %r14812; | |
BB12_400: | |
mov.u32 %r1607, %r16261; | |
mov.u32 %r1606, %r16262; | |
mov.u32 %r1605, %r16263; | |
mov.u32 %r1604, %r16264; | |
setp.le.u32 %p203, %r16245, %r1607; | |
mov.u32 %r16249, %r1607; | |
mov.u32 %r16250, %r1606; | |
mov.u32 %r16251, %r1605; | |
mov.u32 %r16252, %r1604; | |
@%p203 bra BB12_402; | |
st.local.v4.u32 [%rd2+768], {%r1607, %r1606, %r1605, %r1604}; | |
st.local.v4.u32 [%rd2+784], {%r16245, %r16246, %r16247, %r16248}; | |
mov.u32 %r14802, %r16248; | |
mov.u32 %r14804, %r16247; | |
mov.u32 %r14806, %r16246; | |
mov.u32 %r14808, %r16245; | |
mov.u32 %r16248, %r1604; | |
mov.u32 %r16247, %r1605; | |
mov.u32 %r16246, %r1606; | |
mov.u32 %r16245, %r1607; | |
mov.u32 %r16249, %r14808; | |
mov.u32 %r16250, %r14806; | |
mov.u32 %r16251, %r14804; | |
mov.u32 %r16252, %r14802; | |
BB12_402: | |
mov.u32 %r16229, %r16245; | |
mov.u32 %r16230, %r16246; | |
mov.u32 %r16231, %r16247; | |
mov.u32 %r16232, %r16248; | |
mov.u32 %r16233, %r16249; | |
mov.u32 %r16234, %r16250; | |
mov.u32 %r16235, %r16251; | |
mov.u32 %r16236, %r16252; | |
mul.lo.s64 %rd1857, %rd113, 1792; | |
add.s64 %rd1858, %rd6, %rd1857; | |
bfe.u32 %r6744, %r1580, 22, 6; | |
mul.wide.u32 %rd1859, %r6744, 28; | |
add.s64 %rd1860, %rd1858, %rd1859; | |
ld.global.u32 %r1616, [%rd1860+-8]; | |
and.b32 %r6745, %r1616, 65535; | |
mul.wide.u32 %rd1861, %r6745, 1792; | |
add.s64 %rd1862, %rd4, %rd1861; | |
cvt.u64.u32 %rd117, %r6745; | |
bfe.u32 %r6746, %r1616, 16, 6; | |
mul.wide.u32 %rd1863, %r6746, 28; | |
add.s64 %rd1864, %rd1862, %rd1863; | |
ld.global.u32 %r1617, [%rd1864+-12]; | |
and.b32 %r6747, %r1617, 65535; | |
cvt.u64.u32 %rd118, %r6747; | |
bfe.u32 %r6748, %r1617, 16, 6; | |
mul.wide.u32 %rd1865, %r6747, 1792; | |
add.s64 %rd1866, %rd415, %rd1865; | |
mul.wide.u32 %rd1867, %r6748, 28; | |
add.s64 %rd1868, %rd1866, %rd1867; | |
ld.global.u32 %r6749, [%rd1868]; | |
and.b32 %r6750, %r6749, 65535; | |
bfe.u32 %r6751, %r6749, 16, 6; | |
mul.wide.u32 %rd1869, %r6750, 1792; | |
add.s64 %rd1870, %rd414, %rd1869; | |
mul.wide.u32 %rd1871, %r6751, 28; | |
add.s64 %rd1872, %rd1870, %rd1871; | |
ld.global.u32 %r6752, [%rd1872]; | |
and.b32 %r6753, %r6752, 65535; | |
shl.b32 %r6754, %r6753, 6; | |
bfe.u32 %r6755, %r6752, 16, 6; | |
or.b32 %r1618, %r6754, %r6755; | |
st.local.u32 [%rd2+800], %r1618; | |
bfe.u32 %r6756, %r6749, 22, 6; | |
mul.wide.u32 %rd1873, %r6756, 28; | |
add.s64 %rd1874, %rd1870, %rd1873; | |
ld.global.u32 %r6757, [%rd1874]; | |
and.b32 %r6758, %r6757, 65535; | |
shl.b32 %r6759, %r6758, 6; | |
bfe.u32 %r6760, %r6757, 16, 6; | |
or.b32 %r16282, %r6759, %r6760; | |
st.local.u32 [%rd2+804], %r16282; | |
setp.le.u32 %p204, %r1618, %r16282; | |
mov.u32 %r16281, %r1618; | |
@%p204 bra BB12_404; | |
st.local.v2.u32 [%rd2+800], {%r16282, %r1618}; | |
mov.u32 %r14845, %r16282; | |
mov.u32 %r16282, %r1618; | |
mov.u32 %r16281, %r14845; | |
BB12_404: | |
mov.u32 %r16277, %r16281; | |
mov.u32 %r16278, %r16282; | |
bfe.u32 %r6761, %r1617, 22, 6; | |
mul.lo.s64 %rd1875, %rd118, 1792; | |
add.s64 %rd1876, %rd415, %rd1875; | |
mul.wide.u32 %rd1877, %r6761, 28; | |
add.s64 %rd1878, %rd1876, %rd1877; | |
ld.global.u32 %r6762, [%rd1878]; | |
and.b32 %r6763, %r6762, 65535; | |
bfe.u32 %r6764, %r6762, 16, 6; | |
mul.wide.u32 %rd1879, %r6763, 1792; | |
add.s64 %rd1880, %rd414, %rd1879; | |
mul.wide.u32 %rd1881, %r6764, 28; | |
add.s64 %rd1882, %rd1880, %rd1881; | |
ld.global.u32 %r6765, [%rd1882]; | |
and.b32 %r6766, %r6765, 65535; | |
shl.b32 %r6767, %r6766, 6; | |
bfe.u32 %r6768, %r6765, 16, 6; | |
or.b32 %r1622, %r6767, %r6768; | |
st.local.u32 [%rd2+808], %r1622; | |
bfe.u32 %r6769, %r6762, 22, 6; | |
mul.wide.u32 %rd1883, %r6769, 28; | |
add.s64 %rd1884, %rd1880, %rd1883; | |
ld.global.u32 %r6770, [%rd1884]; | |
and.b32 %r6771, %r6770, 65535; | |
shl.b32 %r6772, %r6771, 6; | |
bfe.u32 %r6773, %r6770, 16, 6; | |
or.b32 %r16284, %r6772, %r6773; | |
st.local.u32 [%rd2+812], %r16284; | |
setp.le.u32 %p205, %r1622, %r16284; | |
mov.u32 %r16283, %r1622; | |
@%p205 bra BB12_406; | |
st.local.v2.u32 [%rd2+808], {%r16284, %r1622}; | |
mov.u32 %r14851, %r16284; | |
mov.u32 %r16284, %r1622; | |
mov.u32 %r16283, %r14851; | |
BB12_406: | |
mov.u32 %r1625, %r16283; | |
mov.u32 %r1624, %r16284; | |
setp.le.u32 %p206, %r16277, %r1625; | |
mov.u32 %r16279, %r1625; | |
mov.u32 %r16280, %r1624; | |
@%p206 bra BB12_408; | |
st.local.v4.u32 [%rd2+800], {%r1625, %r1624, %r16277, %r16278}; | |
mov.u32 %r14848, %r16278; | |
mov.u32 %r14850, %r16277; | |
mov.u32 %r16278, %r1624; | |
mov.u32 %r16277, %r1625; | |
mov.u32 %r16279, %r14850; | |
mov.u32 %r16280, %r14848; | |
BB12_408: | |
mov.u32 %r16269, %r16277; | |
mov.u32 %r16270, %r16278; | |
mov.u32 %r16271, %r16279; | |
mov.u32 %r16272, %r16280; | |
mul.lo.s64 %rd1885, %rd117, 1792; | |
add.s64 %rd1886, %rd4, %rd1885; | |
bfe.u32 %r6774, %r1616, 22, 6; | |
mul.wide.u32 %rd1887, %r6774, 28; | |
add.s64 %rd1888, %rd1886, %rd1887; | |
ld.global.u32 %r1630, [%rd1888+-12]; | |
and.b32 %r6775, %r1630, 65535; | |
cvt.u64.u32 %rd119, %r6775; | |
bfe.u32 %r6776, %r1630, 16, 6; | |
mul.wide.u32 %rd1889, %r6775, 1792; | |
add.s64 %rd1890, %rd415, %rd1889; | |
mul.wide.u32 %rd1891, %r6776, 28; | |
add.s64 %rd1892, %rd1890, %rd1891; | |
ld.global.u32 %r6777, [%rd1892]; | |
and.b32 %r6778, %r6777, 65535; | |
bfe.u32 %r6779, %r6777, 16, 6; | |
mul.wide.u32 %rd1893, %r6778, 1792; | |
add.s64 %rd1894, %rd414, %rd1893; | |
mul.wide.u32 %rd1895, %r6779, 28; | |
add.s64 %rd1896, %rd1894, %rd1895; | |
ld.global.u32 %r6780, [%rd1896]; | |
and.b32 %r6781, %r6780, 65535; | |
shl.b32 %r6782, %r6781, 6; | |
bfe.u32 %r6783, %r6780, 16, 6; | |
or.b32 %r1631, %r6782, %r6783; | |
st.local.u32 [%rd2+816], %r1631; | |
bfe.u32 %r6784, %r6777, 22, 6; | |
mul.wide.u32 %rd1897, %r6784, 28; | |
add.s64 %rd1898, %rd1894, %rd1897; | |
ld.global.u32 %r6785, [%rd1898]; | |
and.b32 %r6786, %r6785, 65535; | |
shl.b32 %r6787, %r6786, 6; | |
bfe.u32 %r6788, %r6785, 16, 6; | |
or.b32 %r16290, %r6787, %r6788; | |
st.local.u32 [%rd2+820], %r16290; | |
setp.le.u32 %p207, %r1631, %r16290; | |
mov.u32 %r16289, %r1631; | |
@%p207 bra BB12_410; | |
st.local.v2.u32 [%rd2+816], {%r16290, %r1631}; | |
mov.u32 %r14865, %r16290; | |
mov.u32 %r16290, %r1631; | |
mov.u32 %r16289, %r14865; | |
BB12_410: | |
mov.u32 %r16285, %r16289; | |
mov.u32 %r16286, %r16290; | |
bfe.u32 %r6789, %r1630, 22, 6; | |
mul.lo.s64 %rd1899, %rd119, 1792; | |
add.s64 %rd1900, %rd415, %rd1899; | |
mul.wide.u32 %rd1901, %r6789, 28; | |
add.s64 %rd1902, %rd1900, %rd1901; | |
ld.global.u32 %r6790, [%rd1902]; | |
and.b32 %r6791, %r6790, 65535; | |
bfe.u32 %r6792, %r6790, 16, 6; | |
mul.wide.u32 %rd1903, %r6791, 1792; | |
add.s64 %rd1904, %rd414, %rd1903; | |
mul.wide.u32 %rd1905, %r6792, 28; | |
add.s64 %rd1906, %rd1904, %rd1905; | |
ld.global.u32 %r6793, [%rd1906]; | |
and.b32 %r6794, %r6793, 65535; | |
shl.b32 %r6795, %r6794, 6; | |
bfe.u32 %r6796, %r6793, 16, 6; | |
or.b32 %r1635, %r6795, %r6796; | |
st.local.u32 [%rd2+824], %r1635; | |
bfe.u32 %r6797, %r6790, 22, 6; | |
mul.wide.u32 %rd1907, %r6797, 28; | |
add.s64 %rd1908, %rd1904, %rd1907; | |
ld.global.u32 %r6798, [%rd1908]; | |
and.b32 %r6799, %r6798, 65535; | |
shl.b32 %r6800, %r6799, 6; | |
bfe.u32 %r6801, %r6798, 16, 6; | |
or.b32 %r16292, %r6800, %r6801; | |
st.local.u32 [%rd2+828], %r16292; | |
setp.le.u32 %p208, %r1635, %r16292; | |
mov.u32 %r16291, %r1635; | |
@%p208 bra BB12_412; | |
st.local.v2.u32 [%rd2+824], {%r16292, %r1635}; | |
mov.u32 %r14871, %r16292; | |
mov.u32 %r16292, %r1635; | |
mov.u32 %r16291, %r14871; | |
BB12_412: | |
mov.u32 %r1638, %r16291; | |
mov.u32 %r1637, %r16292; | |
setp.le.u32 %p209, %r16285, %r1638; | |
mov.u32 %r16287, %r1638; | |
mov.u32 %r16288, %r1637; | |
@%p209 bra BB12_414; | |
st.local.v4.u32 [%rd2+816], {%r1638, %r1637, %r16285, %r16286}; | |
mov.u32 %r14868, %r16286; | |
mov.u32 %r14870, %r16285; | |
mov.u32 %r16286, %r1637; | |
mov.u32 %r16285, %r1638; | |
mov.u32 %r16287, %r14870; | |
mov.u32 %r16288, %r14868; | |
BB12_414: | |
mov.u32 %r1642, %r16285; | |
mov.u32 %r1641, %r16286; | |
mov.u32 %r1640, %r16287; | |
mov.u32 %r1639, %r16288; | |
setp.le.u32 %p210, %r16269, %r1642; | |
mov.u32 %r16273, %r1642; | |
mov.u32 %r16274, %r1641; | |
mov.u32 %r16275, %r1640; | |
mov.u32 %r16276, %r1639; | |
@%p210 bra BB12_416; | |
st.local.v4.u32 [%rd2+800], {%r1642, %r1641, %r1640, %r1639}; | |
st.local.v4.u32 [%rd2+816], {%r16269, %r16270, %r16271, %r16272}; | |
mov.u32 %r14858, %r16272; | |
mov.u32 %r14860, %r16271; | |
mov.u32 %r14862, %r16270; | |
mov.u32 %r14864, %r16269; | |
mov.u32 %r16272, %r1639; | |
mov.u32 %r16271, %r1640; | |
mov.u32 %r16270, %r1641; | |
mov.u32 %r16269, %r1642; | |
mov.u32 %r16273, %r14864; | |
mov.u32 %r16274, %r14862; | |
mov.u32 %r16275, %r14860; | |
mov.u32 %r16276, %r14858; | |
BB12_416: | |
mov.u32 %r1650, %r16269; | |
mov.u32 %r1649, %r16270; | |
mov.u32 %r1648, %r16271; | |
mov.u32 %r1647, %r16272; | |
mov.u32 %r1646, %r16273; | |
mov.u32 %r1645, %r16274; | |
mov.u32 %r1644, %r16275; | |
mov.u32 %r1643, %r16276; | |
setp.le.u32 %p211, %r16229, %r1650; | |
mov.u32 %r16237, %r1650; | |
mov.u32 %r16238, %r1649; | |
mov.u32 %r16239, %r1648; | |
mov.u32 %r16240, %r1647; | |
mov.u32 %r16241, %r1646; | |
mov.u32 %r16242, %r1645; | |
mov.u32 %r16243, %r1644; | |
mov.u32 %r16244, %r1643; | |
@%p211 bra BB12_418; | |
st.local.v4.u32 [%rd2+768], {%r1650, %r1649, %r1648, %r1647}; | |
st.local.v4.u32 [%rd2+800], {%r16229, %r16230, %r16231, %r16232}; | |
st.local.v4.u32 [%rd2+784], {%r1646, %r1645, %r1644, %r1643}; | |
st.local.v4.u32 [%rd2+816], {%r16233, %r16234, %r16235, %r16236}; | |
mov.u32 %r14830, %r16236; | |
mov.u32 %r14832, %r16235; | |
mov.u32 %r14834, %r16234; | |
mov.u32 %r14836, %r16233; | |
mov.u32 %r14838, %r16232; | |
mov.u32 %r14840, %r16231; | |
mov.u32 %r14842, %r16230; | |
mov.u32 %r14844, %r16229; | |
mov.u32 %r16236, %r1643; | |
mov.u32 %r16235, %r1644; | |
mov.u32 %r16234, %r1645; | |
mov.u32 %r16233, %r1646; | |
mov.u32 %r16232, %r1647; | |
mov.u32 %r16231, %r1648; | |
mov.u32 %r16230, %r1649; | |
mov.u32 %r16229, %r1650; | |
mov.u32 %r16237, %r14844; | |
mov.u32 %r16238, %r14842; | |
mov.u32 %r16239, %r14840; | |
mov.u32 %r16240, %r14838; | |
mov.u32 %r16241, %r14836; | |
mov.u32 %r16242, %r14834; | |
mov.u32 %r16243, %r14832; | |
mov.u32 %r16244, %r14830; | |
BB12_418: | |
mov.u32 %r16197, %r16229; | |
mov.u32 %r16198, %r16230; | |
mov.u32 %r16199, %r16231; | |
mov.u32 %r16200, %r16232; | |
mov.u32 %r16201, %r16233; | |
mov.u32 %r16202, %r16234; | |
mov.u32 %r16203, %r16235; | |
mov.u32 %r16204, %r16236; | |
mov.u32 %r16205, %r16237; | |
mov.u32 %r16206, %r16238; | |
mov.u32 %r16207, %r16239; | |
mov.u32 %r16208, %r16240; | |
mov.u32 %r16209, %r16241; | |
mov.u32 %r16210, %r16242; | |
mov.u32 %r16211, %r16243; | |
mov.u32 %r16212, %r16244; | |
mul.lo.s64 %rd1909, %rd112, 1792; | |
add.s64 %rd1910, %rd4, %rd1909; | |
bfe.u32 %r6802, %r1579, 22, 6; | |
mul.wide.u32 %rd1911, %r6802, 28; | |
add.s64 %rd1912, %rd1910, %rd1911; | |
ld.global.u32 %r1667, [%rd1912+-8]; | |
and.b32 %r6803, %r1667, 65535; | |
mul.wide.u32 %rd1913, %r6803, 1792; | |
add.s64 %rd1914, %rd6, %rd1913; | |
bfe.u32 %r6804, %r1667, 16, 6; | |
mul.wide.u32 %rd1915, %r6804, 28; | |
add.s64 %rd1916, %rd1914, %rd1915; | |
ld.global.u32 %r1668, [%rd1916+-8]; | |
and.b32 %r6805, %r1668, 65535; | |
mul.wide.u32 %rd1917, %r6805, 1792; | |
add.s64 %rd1918, %rd4, %rd1917; | |
cvt.u64.u32 %rd120, %r6803; | |
cvt.u64.u32 %rd121, %r6805; | |
bfe.u32 %r6806, %r1668, 16, 6; | |
mul.wide.u32 %rd1919, %r6806, 28; | |
add.s64 %rd1920, %rd1918, %rd1919; | |
ld.global.u32 %r1669, [%rd1920+-12]; | |
and.b32 %r6807, %r1669, 65535; | |
cvt.u64.u32 %rd122, %r6807; | |
bfe.u32 %r6808, %r1669, 16, 6; | |
mul.wide.u32 %rd1921, %r6807, 1792; | |
add.s64 %rd1922, %rd415, %rd1921; | |
mul.wide.u32 %rd1923, %r6808, 28; | |
add.s64 %rd1924, %rd1922, %rd1923; | |
ld.global.u32 %r6809, [%rd1924]; | |
and.b32 %r6810, %r6809, 65535; | |
bfe.u32 %r6811, %r6809, 16, 6; | |
mul.wide.u32 %rd1925, %r6810, 1792; | |
add.s64 %rd1926, %rd414, %rd1925; | |
mul.wide.u32 %rd1927, %r6811, 28; | |
add.s64 %rd1928, %rd1926, %rd1927; | |
ld.global.u32 %r6812, [%rd1928]; | |
and.b32 %r6813, %r6812, 65535; | |
shl.b32 %r6814, %r6813, 6; | |
bfe.u32 %r6815, %r6812, 16, 6; | |
or.b32 %r1670, %r6814, %r6815; | |
st.local.u32 [%rd2+832], %r1670; | |
bfe.u32 %r6816, %r6809, 22, 6; | |
mul.wide.u32 %rd1929, %r6816, 28; | |
add.s64 %rd1930, %rd1926, %rd1929; | |
ld.global.u32 %r6817, [%rd1930]; | |
and.b32 %r6818, %r6817, 65535; | |
shl.b32 %r6819, %r6818, 6; | |
bfe.u32 %r6820, %r6817, 16, 6; | |
or.b32 %r16322, %r6819, %r6820; | |
st.local.u32 [%rd2+836], %r16322; | |
setp.le.u32 %p212, %r1670, %r16322; | |
mov.u32 %r16321, %r1670; | |
@%p212 bra BB12_420; | |
st.local.v2.u32 [%rd2+832], {%r16322, %r1670}; | |
mov.u32 %r14933, %r16322; | |
mov.u32 %r16322, %r1670; | |
mov.u32 %r16321, %r14933; | |
BB12_420: | |
mov.u32 %r16317, %r16321; | |
mov.u32 %r16318, %r16322; | |
bfe.u32 %r6821, %r1669, 22, 6; | |
mul.lo.s64 %rd1931, %rd122, 1792; | |
add.s64 %rd1932, %rd415, %rd1931; | |
mul.wide.u32 %rd1933, %r6821, 28; | |
add.s64 %rd1934, %rd1932, %rd1933; | |
ld.global.u32 %r6822, [%rd1934]; | |
and.b32 %r6823, %r6822, 65535; | |
bfe.u32 %r6824, %r6822, 16, 6; | |
mul.wide.u32 %rd1935, %r6823, 1792; | |
add.s64 %rd1936, %rd414, %rd1935; | |
mul.wide.u32 %rd1937, %r6824, 28; | |
add.s64 %rd1938, %rd1936, %rd1937; | |
ld.global.u32 %r6825, [%rd1938]; | |
and.b32 %r6826, %r6825, 65535; | |
shl.b32 %r6827, %r6826, 6; | |
bfe.u32 %r6828, %r6825, 16, 6; | |
or.b32 %r1674, %r6827, %r6828; | |
st.local.u32 [%rd2+840], %r1674; | |
bfe.u32 %r6829, %r6822, 22, 6; | |
mul.wide.u32 %rd1939, %r6829, 28; | |
add.s64 %rd1940, %rd1936, %rd1939; | |
ld.global.u32 %r6830, [%rd1940]; | |
and.b32 %r6831, %r6830, 65535; | |
shl.b32 %r6832, %r6831, 6; | |
bfe.u32 %r6833, %r6830, 16, 6; | |
or.b32 %r16324, %r6832, %r6833; | |
st.local.u32 [%rd2+844], %r16324; | |
setp.le.u32 %p213, %r1674, %r16324; | |
mov.u32 %r16323, %r1674; | |
@%p213 bra BB12_422; | |
st.local.v2.u32 [%rd2+840], {%r16324, %r1674}; | |
mov.u32 %r14939, %r16324; | |
mov.u32 %r16324, %r1674; | |
mov.u32 %r16323, %r14939; | |
BB12_422: | |
mov.u32 %r1677, %r16323; | |
mov.u32 %r1676, %r16324; | |
setp.le.u32 %p214, %r16317, %r1677; | |
mov.u32 %r16319, %r1677; | |
mov.u32 %r16320, %r1676; | |
@%p214 bra BB12_424; | |
st.local.v4.u32 [%rd2+832], {%r1677, %r1676, %r16317, %r16318}; | |
mov.u32 %r14936, %r16318; | |
mov.u32 %r14938, %r16317; | |
mov.u32 %r16318, %r1676; | |
mov.u32 %r16317, %r1677; | |
mov.u32 %r16319, %r14938; | |
mov.u32 %r16320, %r14936; | |
BB12_424: | |
mov.u32 %r16309, %r16317; | |
mov.u32 %r16310, %r16318; | |
mov.u32 %r16311, %r16319; | |
mov.u32 %r16312, %r16320; | |
mul.lo.s64 %rd1941, %rd121, 1792; | |
add.s64 %rd1942, %rd4, %rd1941; | |
bfe.u32 %r6834, %r1668, 22, 6; | |
mul.wide.u32 %rd1943, %r6834, 28; | |
add.s64 %rd1944, %rd1942, %rd1943; | |
ld.global.u32 %r1682, [%rd1944+-12]; | |
and.b32 %r6835, %r1682, 65535; | |
cvt.u64.u32 %rd123, %r6835; | |
bfe.u32 %r6836, %r1682, 16, 6; | |
mul.wide.u32 %rd1945, %r6835, 1792; | |
add.s64 %rd1946, %rd415, %rd1945; | |
mul.wide.u32 %rd1947, %r6836, 28; | |
add.s64 %rd1948, %rd1946, %rd1947; | |
ld.global.u32 %r6837, [%rd1948]; | |
and.b32 %r6838, %r6837, 65535; | |
bfe.u32 %r6839, %r6837, 16, 6; | |
mul.wide.u32 %rd1949, %r6838, 1792; | |
add.s64 %rd1950, %rd414, %rd1949; | |
mul.wide.u32 %rd1951, %r6839, 28; | |
add.s64 %rd1952, %rd1950, %rd1951; | |
ld.global.u32 %r6840, [%rd1952]; | |
and.b32 %r6841, %r6840, 65535; | |
shl.b32 %r6842, %r6841, 6; | |
bfe.u32 %r6843, %r6840, 16, 6; | |
or.b32 %r1683, %r6842, %r6843; | |
st.local.u32 [%rd2+848], %r1683; | |
bfe.u32 %r6844, %r6837, 22, 6; | |
mul.wide.u32 %rd1953, %r6844, 28; | |
add.s64 %rd1954, %rd1950, %rd1953; | |
ld.global.u32 %r6845, [%rd1954]; | |
and.b32 %r6846, %r6845, 65535; | |
shl.b32 %r6847, %r6846, 6; | |
bfe.u32 %r6848, %r6845, 16, 6; | |
or.b32 %r16330, %r6847, %r6848; | |
st.local.u32 [%rd2+852], %r16330; | |
setp.le.u32 %p215, %r1683, %r16330; | |
mov.u32 %r16329, %r1683; | |
@%p215 bra BB12_426; | |
st.local.v2.u32 [%rd2+848], {%r16330, %r1683}; | |
mov.u32 %r14953, %r16330; | |
mov.u32 %r16330, %r1683; | |
mov.u32 %r16329, %r14953; | |
BB12_426: | |
mov.u32 %r16325, %r16329; | |
mov.u32 %r16326, %r16330; | |
bfe.u32 %r6849, %r1682, 22, 6; | |
mul.lo.s64 %rd1955, %rd123, 1792; | |
add.s64 %rd1956, %rd415, %rd1955; | |
mul.wide.u32 %rd1957, %r6849, 28; | |
add.s64 %rd1958, %rd1956, %rd1957; | |
ld.global.u32 %r6850, [%rd1958]; | |
and.b32 %r6851, %r6850, 65535; | |
bfe.u32 %r6852, %r6850, 16, 6; | |
mul.wide.u32 %rd1959, %r6851, 1792; | |
add.s64 %rd1960, %rd414, %rd1959; | |
mul.wide.u32 %rd1961, %r6852, 28; | |
add.s64 %rd1962, %rd1960, %rd1961; | |
ld.global.u32 %r6853, [%rd1962]; | |
and.b32 %r6854, %r6853, 65535; | |
shl.b32 %r6855, %r6854, 6; | |
bfe.u32 %r6856, %r6853, 16, 6; | |
or.b32 %r1687, %r6855, %r6856; | |
st.local.u32 [%rd2+856], %r1687; | |
bfe.u32 %r6857, %r6850, 22, 6; | |
mul.wide.u32 %rd1963, %r6857, 28; | |
add.s64 %rd1964, %rd1960, %rd1963; | |
ld.global.u32 %r6858, [%rd1964]; | |
and.b32 %r6859, %r6858, 65535; | |
shl.b32 %r6860, %r6859, 6; | |
bfe.u32 %r6861, %r6858, 16, 6; | |
or.b32 %r16332, %r6860, %r6861; | |
st.local.u32 [%rd2+860], %r16332; | |
setp.le.u32 %p216, %r1687, %r16332; | |
mov.u32 %r16331, %r1687; | |
@%p216 bra BB12_428; | |
st.local.v2.u32 [%rd2+856], {%r16332, %r1687}; | |
mov.u32 %r14959, %r16332; | |
mov.u32 %r16332, %r1687; | |
mov.u32 %r16331, %r14959; | |
BB12_428: | |
mov.u32 %r1690, %r16331; | |
mov.u32 %r1689, %r16332; | |
setp.le.u32 %p217, %r16325, %r1690; | |
mov.u32 %r16327, %r1690; | |
mov.u32 %r16328, %r1689; | |
@%p217 bra BB12_430; | |
st.local.v4.u32 [%rd2+848], {%r1690, %r1689, %r16325, %r16326}; | |
mov.u32 %r14956, %r16326; | |
mov.u32 %r14958, %r16325; | |
mov.u32 %r16326, %r1689; | |
mov.u32 %r16325, %r1690; | |
mov.u32 %r16327, %r14958; | |
mov.u32 %r16328, %r14956; | |
BB12_430: | |
mov.u32 %r1694, %r16325; | |
mov.u32 %r1693, %r16326; | |
mov.u32 %r1692, %r16327; | |
mov.u32 %r1691, %r16328; | |
setp.le.u32 %p218, %r16309, %r1694; | |
mov.u32 %r16313, %r1694; | |
mov.u32 %r16314, %r1693; | |
mov.u32 %r16315, %r1692; | |
mov.u32 %r16316, %r1691; | |
@%p218 bra BB12_432; | |
st.local.v4.u32 [%rd2+832], {%r1694, %r1693, %r1692, %r1691}; | |
st.local.v4.u32 [%rd2+848], {%r16309, %r16310, %r16311, %r16312}; | |
mov.u32 %r14946, %r16312; | |
mov.u32 %r14948, %r16311; | |
mov.u32 %r14950, %r16310; | |
mov.u32 %r14952, %r16309; | |
mov.u32 %r16312, %r1691; | |
mov.u32 %r16311, %r1692; | |
mov.u32 %r16310, %r1693; | |
mov.u32 %r16309, %r1694; | |
mov.u32 %r16313, %r14952; | |
mov.u32 %r16314, %r14950; | |
mov.u32 %r16315, %r14948; | |
mov.u32 %r16316, %r14946; | |
BB12_432: | |
mov.u32 %r16293, %r16309; | |
mov.u32 %r16294, %r16310; | |
mov.u32 %r16295, %r16311; | |
mov.u32 %r16296, %r16312; | |
mov.u32 %r16297, %r16313; | |
mov.u32 %r16298, %r16314; | |
mov.u32 %r16299, %r16315; | |
mov.u32 %r16300, %r16316; | |
mul.lo.s64 %rd1965, %rd120, 1792; | |
add.s64 %rd1966, %rd6, %rd1965; | |
bfe.u32 %r6862, %r1667, 22, 6; | |
mul.wide.u32 %rd1967, %r6862, 28; | |
add.s64 %rd1968, %rd1966, %rd1967; | |
ld.global.u32 %r1703, [%rd1968+-8]; | |
and.b32 %r6863, %r1703, 65535; | |
mul.wide.u32 %rd1969, %r6863, 1792; | |
add.s64 %rd1970, %rd4, %rd1969; | |
cvt.u64.u32 %rd124, %r6863; | |
bfe.u32 %r6864, %r1703, 16, 6; | |
mul.wide.u32 %rd1971, %r6864, 28; | |
add.s64 %rd1972, %rd1970, %rd1971; | |
ld.global.u32 %r1704, [%rd1972+-12]; | |
and.b32 %r6865, %r1704, 65535; | |
cvt.u64.u32 %rd125, %r6865; | |
bfe.u32 %r6866, %r1704, 16, 6; | |
mul.wide.u32 %rd1973, %r6865, 1792; | |
add.s64 %rd1974, %rd415, %rd1973; | |
mul.wide.u32 %rd1975, %r6866, 28; | |
add.s64 %rd1976, %rd1974, %rd1975; | |
ld.global.u32 %r6867, [%rd1976]; | |
and.b32 %r6868, %r6867, 65535; | |
bfe.u32 %r6869, %r6867, 16, 6; | |
mul.wide.u32 %rd1977, %r6868, 1792; | |
add.s64 %rd1978, %rd414, %rd1977; | |
mul.wide.u32 %rd1979, %r6869, 28; | |
add.s64 %rd1980, %rd1978, %rd1979; | |
ld.global.u32 %r6870, [%rd1980]; | |
and.b32 %r6871, %r6870, 65535; | |
shl.b32 %r6872, %r6871, 6; | |
bfe.u32 %r6873, %r6870, 16, 6; | |
or.b32 %r1705, %r6872, %r6873; | |
st.local.u32 [%rd2+864], %r1705; | |
bfe.u32 %r6874, %r6867, 22, 6; | |
mul.wide.u32 %rd1981, %r6874, 28; | |
add.s64 %rd1982, %rd1978, %rd1981; | |
ld.global.u32 %r6875, [%rd1982]; | |
and.b32 %r6876, %r6875, 65535; | |
shl.b32 %r6877, %r6876, 6; | |
bfe.u32 %r6878, %r6875, 16, 6; | |
or.b32 %r16346, %r6877, %r6878; | |
st.local.u32 [%rd2+868], %r16346; | |
setp.le.u32 %p219, %r1705, %r16346; | |
mov.u32 %r16345, %r1705; | |
@%p219 bra BB12_434; | |
st.local.v2.u32 [%rd2+864], {%r16346, %r1705}; | |
mov.u32 %r14989, %r16346; | |
mov.u32 %r16346, %r1705; | |
mov.u32 %r16345, %r14989; | |
BB12_434: | |
mov.u32 %r16341, %r16345; | |
mov.u32 %r16342, %r16346; | |
bfe.u32 %r6879, %r1704, 22, 6; | |
mul.lo.s64 %rd1983, %rd125, 1792; | |
add.s64 %rd1984, %rd415, %rd1983; | |
mul.wide.u32 %rd1985, %r6879, 28; | |
add.s64 %rd1986, %rd1984, %rd1985; | |
ld.global.u32 %r6880, [%rd1986]; | |
and.b32 %r6881, %r6880, 65535; | |
bfe.u32 %r6882, %r6880, 16, 6; | |
mul.wide.u32 %rd1987, %r6881, 1792; | |
add.s64 %rd1988, %rd414, %rd1987; | |
mul.wide.u32 %rd1989, %r6882, 28; | |
add.s64 %rd1990, %rd1988, %rd1989; | |
ld.global.u32 %r6883, [%rd1990]; | |
and.b32 %r6884, %r6883, 65535; | |
shl.b32 %r6885, %r6884, 6; | |
bfe.u32 %r6886, %r6883, 16, 6; | |
or.b32 %r1709, %r6885, %r6886; | |
st.local.u32 [%rd2+872], %r1709; | |
bfe.u32 %r6887, %r6880, 22, 6; | |
mul.wide.u32 %rd1991, %r6887, 28; | |
add.s64 %rd1992, %rd1988, %rd1991; | |
ld.global.u32 %r6888, [%rd1992]; | |
and.b32 %r6889, %r6888, 65535; | |
shl.b32 %r6890, %r6889, 6; | |
bfe.u32 %r6891, %r6888, 16, 6; | |
or.b32 %r16348, %r6890, %r6891; | |
st.local.u32 [%rd2+876], %r16348; | |
setp.le.u32 %p220, %r1709, %r16348; | |
mov.u32 %r16347, %r1709; | |
@%p220 bra BB12_436; | |
st.local.v2.u32 [%rd2+872], {%r16348, %r1709}; | |
mov.u32 %r14995, %r16348; | |
mov.u32 %r16348, %r1709; | |
mov.u32 %r16347, %r14995; | |
BB12_436: | |
mov.u32 %r1712, %r16347; | |
mov.u32 %r1711, %r16348; | |
setp.le.u32 %p221, %r16341, %r1712; | |
mov.u32 %r16343, %r1712; | |
mov.u32 %r16344, %r1711; | |
@%p221 bra BB12_438; | |
st.local.v4.u32 [%rd2+864], {%r1712, %r1711, %r16341, %r16342}; | |
mov.u32 %r14992, %r16342; | |
mov.u32 %r14994, %r16341; | |
mov.u32 %r16342, %r1711; | |
mov.u32 %r16341, %r1712; | |
mov.u32 %r16343, %r14994; | |
mov.u32 %r16344, %r14992; | |
BB12_438: | |
mov.u32 %r16333, %r16341; | |
mov.u32 %r16334, %r16342; | |
mov.u32 %r16335, %r16343; | |
mov.u32 %r16336, %r16344; | |
mul.lo.s64 %rd1993, %rd124, 1792; | |
add.s64 %rd1994, %rd4, %rd1993; | |
bfe.u32 %r6892, %r1703, 22, 6; | |
mul.wide.u32 %rd1995, %r6892, 28; | |
add.s64 %rd1996, %rd1994, %rd1995; | |
ld.global.u32 %r1717, [%rd1996+-12]; | |
and.b32 %r6893, %r1717, 65535; | |
cvt.u64.u32 %rd126, %r6893; | |
bfe.u32 %r6894, %r1717, 16, 6; | |
mul.wide.u32 %rd1997, %r6893, 1792; | |
add.s64 %rd1998, %rd415, %rd1997; | |
mul.wide.u32 %rd1999, %r6894, 28; | |
add.s64 %rd2000, %rd1998, %rd1999; | |
ld.global.u32 %r6895, [%rd2000]; | |
and.b32 %r6896, %r6895, 65535; | |
bfe.u32 %r6897, %r6895, 16, 6; | |
mul.wide.u32 %rd2001, %r6896, 1792; | |
add.s64 %rd2002, %rd414, %rd2001; | |
mul.wide.u32 %rd2003, %r6897, 28; | |
add.s64 %rd2004, %rd2002, %rd2003; | |
ld.global.u32 %r6898, [%rd2004]; | |
and.b32 %r6899, %r6898, 65535; | |
shl.b32 %r6900, %r6899, 6; | |
bfe.u32 %r6901, %r6898, 16, 6; | |
or.b32 %r1718, %r6900, %r6901; | |
st.local.u32 [%rd2+880], %r1718; | |
bfe.u32 %r6902, %r6895, 22, 6; | |
mul.wide.u32 %rd2005, %r6902, 28; | |
add.s64 %rd2006, %rd2002, %rd2005; | |
ld.global.u32 %r6903, [%rd2006]; | |
and.b32 %r6904, %r6903, 65535; | |
shl.b32 %r6905, %r6904, 6; | |
bfe.u32 %r6906, %r6903, 16, 6; | |
or.b32 %r16354, %r6905, %r6906; | |
st.local.u32 [%rd2+884], %r16354; | |
setp.le.u32 %p222, %r1718, %r16354; | |
mov.u32 %r16353, %r1718; | |
@%p222 bra BB12_440; | |
st.local.v2.u32 [%rd2+880], {%r16354, %r1718}; | |
mov.u32 %r15009, %r16354; | |
mov.u32 %r16354, %r1718; | |
mov.u32 %r16353, %r15009; | |
BB12_440: | |
mov.u32 %r16349, %r16353; | |
mov.u32 %r16350, %r16354; | |
bfe.u32 %r6907, %r1717, 22, 6; | |
mul.lo.s64 %rd2007, %rd126, 1792; | |
add.s64 %rd2008, %rd415, %rd2007; | |
mul.wide.u32 %rd2009, %r6907, 28; | |
add.s64 %rd2010, %rd2008, %rd2009; | |
ld.global.u32 %r6908, [%rd2010]; | |
and.b32 %r6909, %r6908, 65535; | |
bfe.u32 %r6910, %r6908, 16, 6; | |
mul.wide.u32 %rd2011, %r6909, 1792; | |
add.s64 %rd2012, %rd414, %rd2011; | |
mul.wide.u32 %rd2013, %r6910, 28; | |
add.s64 %rd2014, %rd2012, %rd2013; | |
ld.global.u32 %r6911, [%rd2014]; | |
and.b32 %r6912, %r6911, 65535; | |
shl.b32 %r6913, %r6912, 6; | |
bfe.u32 %r6914, %r6911, 16, 6; | |
or.b32 %r1722, %r6913, %r6914; | |
st.local.u32 [%rd2+888], %r1722; | |
bfe.u32 %r6915, %r6908, 22, 6; | |
mul.wide.u32 %rd2015, %r6915, 28; | |
add.s64 %rd2016, %rd2012, %rd2015; | |
ld.global.u32 %r6916, [%rd2016]; | |
and.b32 %r6917, %r6916, 65535; | |
shl.b32 %r6918, %r6917, 6; | |
bfe.u32 %r6919, %r6916, 16, 6; | |
or.b32 %r16356, %r6918, %r6919; | |
st.local.u32 [%rd2+892], %r16356; | |
setp.le.u32 %p223, %r1722, %r16356; | |
mov.u32 %r16355, %r1722; | |
@%p223 bra BB12_442; | |
st.local.v2.u32 [%rd2+888], {%r16356, %r1722}; | |
mov.u32 %r15015, %r16356; | |
mov.u32 %r16356, %r1722; | |
mov.u32 %r16355, %r15015; | |
BB12_442: | |
mov.u32 %r1725, %r16355; | |
mov.u32 %r1724, %r16356; | |
setp.le.u32 %p224, %r16349, %r1725; | |
mov.u32 %r16351, %r1725; | |
mov.u32 %r16352, %r1724; | |
@%p224 bra BB12_444; | |
st.local.v4.u32 [%rd2+880], {%r1725, %r1724, %r16349, %r16350}; | |
mov.u32 %r15012, %r16350; | |
mov.u32 %r15014, %r16349; | |
mov.u32 %r16350, %r1724; | |
mov.u32 %r16349, %r1725; | |
mov.u32 %r16351, %r15014; | |
mov.u32 %r16352, %r15012; | |
BB12_444: | |
mov.u32 %r1729, %r16349; | |
mov.u32 %r1728, %r16350; | |
mov.u32 %r1727, %r16351; | |
mov.u32 %r1726, %r16352; | |
setp.le.u32 %p225, %r16333, %r1729; | |
mov.u32 %r16337, %r1729; | |
mov.u32 %r16338, %r1728; | |
mov.u32 %r16339, %r1727; | |
mov.u32 %r16340, %r1726; | |
@%p225 bra BB12_446; | |
st.local.v4.u32 [%rd2+864], {%r1729, %r1728, %r1727, %r1726}; | |
st.local.v4.u32 [%rd2+880], {%r16333, %r16334, %r16335, %r16336}; | |
mov.u32 %r15002, %r16336; | |
mov.u32 %r15004, %r16335; | |
mov.u32 %r15006, %r16334; | |
mov.u32 %r15008, %r16333; | |
mov.u32 %r16336, %r1726; | |
mov.u32 %r16335, %r1727; | |
mov.u32 %r16334, %r1728; | |
mov.u32 %r16333, %r1729; | |
mov.u32 %r16337, %r15008; | |
mov.u32 %r16338, %r15006; | |
mov.u32 %r16339, %r15004; | |
mov.u32 %r16340, %r15002; | |
BB12_446: | |
mov.u32 %r1737, %r16333; | |
mov.u32 %r1736, %r16334; | |
mov.u32 %r1735, %r16335; | |
mov.u32 %r1734, %r16336; | |
mov.u32 %r1733, %r16337; | |
mov.u32 %r1732, %r16338; | |
mov.u32 %r1731, %r16339; | |
mov.u32 %r1730, %r16340; | |
setp.le.u32 %p226, %r16293, %r1737; | |
mov.u32 %r16301, %r1737; | |
mov.u32 %r16302, %r1736; | |
mov.u32 %r16303, %r1735; | |
mov.u32 %r16304, %r1734; | |
mov.u32 %r16305, %r1733; | |
mov.u32 %r16306, %r1732; | |
mov.u32 %r16307, %r1731; | |
mov.u32 %r16308, %r1730; | |
@%p226 bra BB12_448; | |
st.local.v4.u32 [%rd2+832], {%r1737, %r1736, %r1735, %r1734}; | |
st.local.v4.u32 [%rd2+864], {%r16293, %r16294, %r16295, %r16296}; | |
st.local.v4.u32 [%rd2+848], {%r1733, %r1732, %r1731, %r1730}; | |
st.local.v4.u32 [%rd2+880], {%r16297, %r16298, %r16299, %r16300}; | |
mov.u32 %r14974, %r16300; | |
mov.u32 %r14976, %r16299; | |
mov.u32 %r14978, %r16298; | |
mov.u32 %r14980, %r16297; | |
mov.u32 %r14982, %r16296; | |
mov.u32 %r14984, %r16295; | |
mov.u32 %r14986, %r16294; | |
mov.u32 %r14988, %r16293; | |
mov.u32 %r16300, %r1730; | |
mov.u32 %r16299, %r1731; | |
mov.u32 %r16298, %r1732; | |
mov.u32 %r16297, %r1733; | |
mov.u32 %r16296, %r1734; | |
mov.u32 %r16295, %r1735; | |
mov.u32 %r16294, %r1736; | |
mov.u32 %r16293, %r1737; | |
mov.u32 %r16301, %r14988; | |
mov.u32 %r16302, %r14986; | |
mov.u32 %r16303, %r14984; | |
mov.u32 %r16304, %r14982; | |
mov.u32 %r16305, %r14980; | |
mov.u32 %r16306, %r14978; | |
mov.u32 %r16307, %r14976; | |
mov.u32 %r16308, %r14974; | |
BB12_448: | |
mov.u32 %r1753, %r16293; | |
mov.u32 %r1752, %r16294; | |
mov.u32 %r1751, %r16295; | |
mov.u32 %r1750, %r16296; | |
mov.u32 %r1749, %r16297; | |
mov.u32 %r1748, %r16298; | |
mov.u32 %r1747, %r16299; | |
mov.u32 %r1746, %r16300; | |
mov.u32 %r1745, %r16301; | |
mov.u32 %r1744, %r16302; | |
mov.u32 %r1743, %r16303; | |
mov.u32 %r1742, %r16304; | |
mov.u32 %r1741, %r16305; | |
mov.u32 %r1740, %r16306; | |
mov.u32 %r1739, %r16307; | |
mov.u32 %r1738, %r16308; | |
setp.le.u32 %p227, %r16197, %r1753; | |
mov.u32 %r16213, %r1753; | |
mov.u32 %r16214, %r1752; | |
mov.u32 %r16215, %r1751; | |
mov.u32 %r16216, %r1750; | |
mov.u32 %r16217, %r1749; | |
mov.u32 %r16218, %r1748; | |
mov.u32 %r16219, %r1747; | |
mov.u32 %r16220, %r1746; | |
mov.u32 %r16221, %r1745; | |
mov.u32 %r16222, %r1744; | |
mov.u32 %r16223, %r1743; | |
mov.u32 %r16224, %r1742; | |
mov.u32 %r16225, %r1741; | |
mov.u32 %r16226, %r1740; | |
mov.u32 %r16227, %r1739; | |
mov.u32 %r16228, %r1738; | |
@%p227 bra BB12_450; | |
st.local.v4.u32 [%rd2+768], {%r1753, %r1752, %r1751, %r1750}; | |
st.local.v4.u32 [%rd2+832], {%r16197, %r16198, %r16199, %r16200}; | |
st.local.v4.u32 [%rd2+784], {%r1749, %r1748, %r1747, %r1746}; | |
st.local.v4.u32 [%rd2+848], {%r16201, %r16202, %r16203, %r16204}; | |
st.local.v4.u32 [%rd2+800], {%r1745, %r1744, %r1743, %r1742}; | |
st.local.v4.u32 [%rd2+864], {%r16205, %r16206, %r16207, %r16208}; | |
st.local.v4.u32 [%rd2+816], {%r1741, %r1740, %r1739, %r1738}; | |
st.local.v4.u32 [%rd2+880], {%r16209, %r16210, %r16211, %r16212}; | |
mov.u32 %r14902, %r16212; | |
mov.u32 %r14904, %r16211; | |
mov.u32 %r14906, %r16210; | |
mov.u32 %r14908, %r16209; | |
mov.u32 %r14910, %r16208; | |
mov.u32 %r14912, %r16207; | |
mov.u32 %r14914, %r16206; | |
mov.u32 %r14916, %r16205; | |
mov.u32 %r14918, %r16204; | |
mov.u32 %r14920, %r16203; | |
mov.u32 %r14922, %r16202; | |
mov.u32 %r14924, %r16201; | |
mov.u32 %r14926, %r16200; | |
mov.u32 %r14928, %r16199; | |
mov.u32 %r14930, %r16198; | |
mov.u32 %r14932, %r16197; | |
mov.u32 %r16212, %r1738; | |
mov.u32 %r16211, %r1739; | |
mov.u32 %r16210, %r1740; | |
mov.u32 %r16209, %r1741; | |
mov.u32 %r16208, %r1742; | |
mov.u32 %r16207, %r1743; | |
mov.u32 %r16206, %r1744; | |
mov.u32 %r16205, %r1745; | |
mov.u32 %r16204, %r1746; | |
mov.u32 %r16203, %r1747; | |
mov.u32 %r16202, %r1748; | |
mov.u32 %r16201, %r1749; | |
mov.u32 %r16200, %r1750; | |
mov.u32 %r16199, %r1751; | |
mov.u32 %r16198, %r1752; | |
mov.u32 %r16197, %r1753; | |
mov.u32 %r16213, %r14932; | |
mov.u32 %r16214, %r14930; | |
mov.u32 %r16215, %r14928; | |
mov.u32 %r16216, %r14926; | |
mov.u32 %r16217, %r14924; | |
mov.u32 %r16218, %r14922; | |
mov.u32 %r16219, %r14920; | |
mov.u32 %r16220, %r14918; | |
mov.u32 %r16221, %r14916; | |
mov.u32 %r16222, %r14914; | |
mov.u32 %r16223, %r14912; | |
mov.u32 %r16224, %r14910; | |
mov.u32 %r16225, %r14908; | |
mov.u32 %r16226, %r14906; | |
mov.u32 %r16227, %r14904; | |
mov.u32 %r16228, %r14902; | |
BB12_450: | |
mov.u32 %r16133, %r16197; | |
mov.u32 %r16134, %r16198; | |
mov.u32 %r16135, %r16199; | |
mov.u32 %r16136, %r16200; | |
mov.u32 %r16137, %r16201; | |
mov.u32 %r16138, %r16202; | |
mov.u32 %r16139, %r16203; | |
mov.u32 %r16140, %r16204; | |
mov.u32 %r16141, %r16205; | |
mov.u32 %r16142, %r16206; | |
mov.u32 %r16143, %r16207; | |
mov.u32 %r16144, %r16208; | |
mov.u32 %r16145, %r16209; | |
mov.u32 %r16146, %r16210; | |
mov.u32 %r16147, %r16211; | |
mov.u32 %r16148, %r16212; | |
mov.u32 %r16149, %r16213; | |
mov.u32 %r16150, %r16214; | |
mov.u32 %r16151, %r16215; | |
mov.u32 %r16152, %r16216; | |
mov.u32 %r16153, %r16217; | |
mov.u32 %r16154, %r16218; | |
mov.u32 %r16155, %r16219; | |
mov.u32 %r16156, %r16220; | |
mov.u32 %r16157, %r16221; | |
mov.u32 %r16158, %r16222; | |
mov.u32 %r16159, %r16223; | |
mov.u32 %r16160, %r16224; | |
mov.u32 %r16161, %r16225; | |
mov.u32 %r16162, %r16226; | |
mov.u32 %r16163, %r16227; | |
mov.u32 %r16164, %r16228; | |
mul.lo.s64 %rd2017, %rd111, 1792; | |
add.s64 %rd2018, %rd6, %rd2017; | |
bfe.u32 %r6920, %r1578, 22, 6; | |
mul.wide.u32 %rd2019, %r6920, 28; | |
add.s64 %rd2020, %rd2018, %rd2019; | |
ld.global.u32 %r1786, [%rd2020+-4]; | |
and.b32 %r6921, %r1786, 65535; | |
mul.wide.u32 %rd2021, %r6921, 1792; | |
add.s64 %rd2022, %rd4, %rd2021; | |
bfe.u32 %r6922, %r1786, 16, 6; | |
mul.wide.u32 %rd2023, %r6922, 28; | |
add.s64 %rd2024, %rd2022, %rd2023; | |
ld.global.u32 %r1787, [%rd2024+-8]; | |
and.b32 %r6923, %r1787, 65535; | |
mul.wide.u32 %rd2025, %r6923, 1792; | |
add.s64 %rd2026, %rd6, %rd2025; | |
bfe.u32 %r6924, %r1787, 16, 6; | |
mul.wide.u32 %rd2027, %r6924, 28; | |
add.s64 %rd2028, %rd2026, %rd2027; | |
ld.global.u32 %r1788, [%rd2028+-8]; | |
and.b32 %r6925, %r1788, 65535; | |
mul.wide.u32 %rd2029, %r6925, 1792; | |
add.s64 %rd2030, %rd4, %rd2029; | |
cvt.u64.u32 %rd127, %r6921; | |
cvt.u64.u32 %rd128, %r6923; | |
cvt.u64.u32 %rd129, %r6925; | |
bfe.u32 %r6926, %r1788, 16, 6; | |
mul.wide.u32 %rd2031, %r6926, 28; | |
add.s64 %rd2032, %rd2030, %rd2031; | |
ld.global.u32 %r1789, [%rd2032+-12]; | |
and.b32 %r6927, %r1789, 65535; | |
cvt.u64.u32 %rd130, %r6927; | |
bfe.u32 %r6928, %r1789, 16, 6; | |
mul.wide.u32 %rd2033, %r6927, 1792; | |
add.s64 %rd2034, %rd415, %rd2033; | |
mul.wide.u32 %rd2035, %r6928, 28; | |
add.s64 %rd2036, %rd2034, %rd2035; | |
ld.global.u32 %r6929, [%rd2036]; | |
and.b32 %r6930, %r6929, 65535; | |
bfe.u32 %r6931, %r6929, 16, 6; | |
mul.wide.u32 %rd2037, %r6930, 1792; | |
add.s64 %rd2038, %rd414, %rd2037; | |
mul.wide.u32 %rd2039, %r6931, 28; | |
add.s64 %rd2040, %rd2038, %rd2039; | |
ld.global.u32 %r6932, [%rd2040]; | |
and.b32 %r6933, %r6932, 65535; | |
shl.b32 %r6934, %r6933, 6; | |
bfe.u32 %r6935, %r6932, 16, 6; | |
or.b32 %r1790, %r6934, %r6935; | |
st.local.u32 [%rd2+896], %r1790; | |
bfe.u32 %r6936, %r6929, 22, 6; | |
mul.wide.u32 %rd2041, %r6936, 28; | |
add.s64 %rd2042, %rd2038, %rd2041; | |
ld.global.u32 %r6937, [%rd2042]; | |
and.b32 %r6938, %r6937, 65535; | |
shl.b32 %r6939, %r6938, 6; | |
bfe.u32 %r6940, %r6937, 16, 6; | |
or.b32 %r16418, %r6939, %r6940; | |
st.local.u32 [%rd2+900], %r16418; | |
setp.le.u32 %p228, %r1790, %r16418; | |
mov.u32 %r16417, %r1790; | |
@%p228 bra BB12_452; | |
st.local.v2.u32 [%rd2+896], {%r16418, %r1790}; | |
mov.u32 %r15141, %r16418; | |
mov.u32 %r16418, %r1790; | |
mov.u32 %r16417, %r15141; | |
BB12_452: | |
mov.u32 %r16413, %r16417; | |
mov.u32 %r16414, %r16418; | |
bfe.u32 %r6941, %r1789, 22, 6; | |
mul.lo.s64 %rd2043, %rd130, 1792; | |
add.s64 %rd2044, %rd415, %rd2043; | |
mul.wide.u32 %rd2045, %r6941, 28; | |
add.s64 %rd2046, %rd2044, %rd2045; | |
ld.global.u32 %r6942, [%rd2046]; | |
and.b32 %r6943, %r6942, 65535; | |
bfe.u32 %r6944, %r6942, 16, 6; | |
mul.wide.u32 %rd2047, %r6943, 1792; | |
add.s64 %rd2048, %rd414, %rd2047; | |
mul.wide.u32 %rd2049, %r6944, 28; | |
add.s64 %rd2050, %rd2048, %rd2049; | |
ld.global.u32 %r6945, [%rd2050]; | |
and.b32 %r6946, %r6945, 65535; | |
shl.b32 %r6947, %r6946, 6; | |
bfe.u32 %r6948, %r6945, 16, 6; | |
or.b32 %r1794, %r6947, %r6948; | |
st.local.u32 [%rd2+904], %r1794; | |
bfe.u32 %r6949, %r6942, 22, 6; | |
mul.wide.u32 %rd2051, %r6949, 28; | |
add.s64 %rd2052, %rd2048, %rd2051; | |
ld.global.u32 %r6950, [%rd2052]; | |
and.b32 %r6951, %r6950, 65535; | |
shl.b32 %r6952, %r6951, 6; | |
bfe.u32 %r6953, %r6950, 16, 6; | |
or.b32 %r16420, %r6952, %r6953; | |
st.local.u32 [%rd2+908], %r16420; | |
setp.le.u32 %p229, %r1794, %r16420; | |
mov.u32 %r16419, %r1794; | |
@%p229 bra BB12_454; | |
st.local.v2.u32 [%rd2+904], {%r16420, %r1794}; | |
mov.u32 %r15147, %r16420; | |
mov.u32 %r16420, %r1794; | |
mov.u32 %r16419, %r15147; | |
BB12_454: | |
mov.u32 %r1797, %r16419; | |
mov.u32 %r1796, %r16420; | |
setp.le.u32 %p230, %r16413, %r1797; | |
mov.u32 %r16415, %r1797; | |
mov.u32 %r16416, %r1796; | |
@%p230 bra BB12_456; | |
st.local.v4.u32 [%rd2+896], {%r1797, %r1796, %r16413, %r16414}; | |
mov.u32 %r15144, %r16414; | |
mov.u32 %r15146, %r16413; | |
mov.u32 %r16414, %r1796; | |
mov.u32 %r16413, %r1797; | |
mov.u32 %r16415, %r15146; | |
mov.u32 %r16416, %r15144; | |
BB12_456: | |
mov.u32 %r16405, %r16413; | |
mov.u32 %r16406, %r16414; | |
mov.u32 %r16407, %r16415; | |
mov.u32 %r16408, %r16416; | |
mul.lo.s64 %rd2053, %rd129, 1792; | |
add.s64 %rd2054, %rd4, %rd2053; | |
bfe.u32 %r6954, %r1788, 22, 6; | |
mul.wide.u32 %rd2055, %r6954, 28; | |
add.s64 %rd2056, %rd2054, %rd2055; | |
ld.global.u32 %r1802, [%rd2056+-12]; | |
and.b32 %r6955, %r1802, 65535; | |
cvt.u64.u32 %rd131, %r6955; | |
bfe.u32 %r6956, %r1802, 16, 6; | |
mul.wide.u32 %rd2057, %r6955, 1792; | |
add.s64 %rd2058, %rd415, %rd2057; | |
mul.wide.u32 %rd2059, %r6956, 28; | |
add.s64 %rd2060, %rd2058, %rd2059; | |
ld.global.u32 %r6957, [%rd2060]; | |
and.b32 %r6958, %r6957, 65535; | |
bfe.u32 %r6959, %r6957, 16, 6; | |
mul.wide.u32 %rd2061, %r6958, 1792; | |
add.s64 %rd2062, %rd414, %rd2061; | |
mul.wide.u32 %rd2063, %r6959, 28; | |
add.s64 %rd2064, %rd2062, %rd2063; | |
ld.global.u32 %r6960, [%rd2064]; | |
and.b32 %r6961, %r6960, 65535; | |
shl.b32 %r6962, %r6961, 6; | |
bfe.u32 %r6963, %r6960, 16, 6; | |
or.b32 %r1803, %r6962, %r6963; | |
st.local.u32 [%rd2+912], %r1803; | |
bfe.u32 %r6964, %r6957, 22, 6; | |
mul.wide.u32 %rd2065, %r6964, 28; | |
add.s64 %rd2066, %rd2062, %rd2065; | |
ld.global.u32 %r6965, [%rd2066]; | |
and.b32 %r6966, %r6965, 65535; | |
shl.b32 %r6967, %r6966, 6; | |
bfe.u32 %r6968, %r6965, 16, 6; | |
or.b32 %r16426, %r6967, %r6968; | |
st.local.u32 [%rd2+916], %r16426; | |
setp.le.u32 %p231, %r1803, %r16426; | |
mov.u32 %r16425, %r1803; | |
@%p231 bra BB12_458; | |
st.local.v2.u32 [%rd2+912], {%r16426, %r1803}; | |
mov.u32 %r15161, %r16426; | |
mov.u32 %r16426, %r1803; | |
mov.u32 %r16425, %r15161; | |
BB12_458: | |
mov.u32 %r16421, %r16425; | |
mov.u32 %r16422, %r16426; | |
bfe.u32 %r6969, %r1802, 22, 6; | |
mul.lo.s64 %rd2067, %rd131, 1792; | |
add.s64 %rd2068, %rd415, %rd2067; | |
mul.wide.u32 %rd2069, %r6969, 28; | |
add.s64 %rd2070, %rd2068, %rd2069; | |
ld.global.u32 %r6970, [%rd2070]; | |
and.b32 %r6971, %r6970, 65535; | |
bfe.u32 %r6972, %r6970, 16, 6; | |
mul.wide.u32 %rd2071, %r6971, 1792; | |
add.s64 %rd2072, %rd414, %rd2071; | |
mul.wide.u32 %rd2073, %r6972, 28; | |
add.s64 %rd2074, %rd2072, %rd2073; | |
ld.global.u32 %r6973, [%rd2074]; | |
and.b32 %r6974, %r6973, 65535; | |
shl.b32 %r6975, %r6974, 6; | |
bfe.u32 %r6976, %r6973, 16, 6; | |
or.b32 %r1807, %r6975, %r6976; | |
st.local.u32 [%rd2+920], %r1807; | |
bfe.u32 %r6977, %r6970, 22, 6; | |
mul.wide.u32 %rd2075, %r6977, 28; | |
add.s64 %rd2076, %rd2072, %rd2075; | |
ld.global.u32 %r6978, [%rd2076]; | |
and.b32 %r6979, %r6978, 65535; | |
shl.b32 %r6980, %r6979, 6; | |
bfe.u32 %r6981, %r6978, 16, 6; | |
or.b32 %r16428, %r6980, %r6981; | |
st.local.u32 [%rd2+924], %r16428; | |
setp.le.u32 %p232, %r1807, %r16428; | |
mov.u32 %r16427, %r1807; | |
@%p232 bra BB12_460; | |
st.local.v2.u32 [%rd2+920], {%r16428, %r1807}; | |
mov.u32 %r15167, %r16428; | |
mov.u32 %r16428, %r1807; | |
mov.u32 %r16427, %r15167; | |
BB12_460: | |
mov.u32 %r1810, %r16427; | |
mov.u32 %r1809, %r16428; | |
setp.le.u32 %p233, %r16421, %r1810; | |
mov.u32 %r16423, %r1810; | |
mov.u32 %r16424, %r1809; | |
@%p233 bra BB12_462; | |
st.local.v4.u32 [%rd2+912], {%r1810, %r1809, %r16421, %r16422}; | |
mov.u32 %r15164, %r16422; | |
mov.u32 %r15166, %r16421; | |
mov.u32 %r16422, %r1809; | |
mov.u32 %r16421, %r1810; | |
mov.u32 %r16423, %r15166; | |
mov.u32 %r16424, %r15164; | |
BB12_462: | |
mov.u32 %r1814, %r16421; | |
mov.u32 %r1813, %r16422; | |
mov.u32 %r1812, %r16423; | |
mov.u32 %r1811, %r16424; | |
setp.le.u32 %p234, %r16405, %r1814; | |
mov.u32 %r16409, %r1814; | |
mov.u32 %r16410, %r1813; | |
mov.u32 %r16411, %r1812; | |
mov.u32 %r16412, %r1811; | |
@%p234 bra BB12_464; | |
st.local.v4.u32 [%rd2+896], {%r1814, %r1813, %r1812, %r1811}; | |
st.local.v4.u32 [%rd2+912], {%r16405, %r16406, %r16407, %r16408}; | |
mov.u32 %r15154, %r16408; | |
mov.u32 %r15156, %r16407; | |
mov.u32 %r15158, %r16406; | |
mov.u32 %r15160, %r16405; | |
mov.u32 %r16408, %r1811; | |
mov.u32 %r16407, %r1812; | |
mov.u32 %r16406, %r1813; | |
mov.u32 %r16405, %r1814; | |
mov.u32 %r16409, %r15160; | |
mov.u32 %r16410, %r15158; | |
mov.u32 %r16411, %r15156; | |
mov.u32 %r16412, %r15154; | |
BB12_464: | |
mov.u32 %r16389, %r16405; | |
mov.u32 %r16390, %r16406; | |
mov.u32 %r16391, %r16407; | |
mov.u32 %r16392, %r16408; | |
mov.u32 %r16393, %r16409; | |
mov.u32 %r16394, %r16410; | |
mov.u32 %r16395, %r16411; | |
mov.u32 %r16396, %r16412; | |
mul.lo.s64 %rd2077, %rd128, 1792; | |
add.s64 %rd2078, %rd6, %rd2077; | |
bfe.u32 %r6982, %r1787, 22, 6; | |
mul.wide.u32 %rd2079, %r6982, 28; | |
add.s64 %rd2080, %rd2078, %rd2079; | |
ld.global.u32 %r1823, [%rd2080+-8]; | |
and.b32 %r6983, %r1823, 65535; | |
mul.wide.u32 %rd2081, %r6983, 1792; | |
add.s64 %rd2082, %rd4, %rd2081; | |
cvt.u64.u32 %rd132, %r6983; | |
bfe.u32 %r6984, %r1823, 16, 6; | |
mul.wide.u32 %rd2083, %r6984, 28; | |
add.s64 %rd2084, %rd2082, %rd2083; | |
ld.global.u32 %r1824, [%rd2084+-12]; | |
and.b32 %r6985, %r1824, 65535; | |
cvt.u64.u32 %rd133, %r6985; | |
bfe.u32 %r6986, %r1824, 16, 6; | |
mul.wide.u32 %rd2085, %r6985, 1792; | |
add.s64 %rd2086, %rd415, %rd2085; | |
mul.wide.u32 %rd2087, %r6986, 28; | |
add.s64 %rd2088, %rd2086, %rd2087; | |
ld.global.u32 %r6987, [%rd2088]; | |
and.b32 %r6988, %r6987, 65535; | |
bfe.u32 %r6989, %r6987, 16, 6; | |
mul.wide.u32 %rd2089, %r6988, 1792; | |
add.s64 %rd2090, %rd414, %rd2089; | |
mul.wide.u32 %rd2091, %r6989, 28; | |
add.s64 %rd2092, %rd2090, %rd2091; | |
ld.global.u32 %r6990, [%rd2092]; | |
and.b32 %r6991, %r6990, 65535; | |
shl.b32 %r6992, %r6991, 6; | |
bfe.u32 %r6993, %r6990, 16, 6; | |
or.b32 %r1825, %r6992, %r6993; | |
st.local.u32 [%rd2+928], %r1825; | |
bfe.u32 %r6994, %r6987, 22, 6; | |
mul.wide.u32 %rd2093, %r6994, 28; | |
add.s64 %rd2094, %rd2090, %rd2093; | |
ld.global.u32 %r6995, [%rd2094]; | |
and.b32 %r6996, %r6995, 65535; | |
shl.b32 %r6997, %r6996, 6; | |
bfe.u32 %r6998, %r6995, 16, 6; | |
or.b32 %r16442, %r6997, %r6998; | |
st.local.u32 [%rd2+932], %r16442; | |
setp.le.u32 %p235, %r1825, %r16442; | |
mov.u32 %r16441, %r1825; | |
@%p235 bra BB12_466; | |
st.local.v2.u32 [%rd2+928], {%r16442, %r1825}; | |
mov.u32 %r15197, %r16442; | |
mov.u32 %r16442, %r1825; | |
mov.u32 %r16441, %r15197; | |
BB12_466: | |
mov.u32 %r16437, %r16441; | |
mov.u32 %r16438, %r16442; | |
bfe.u32 %r6999, %r1824, 22, 6; | |
mul.lo.s64 %rd2095, %rd133, 1792; | |
add.s64 %rd2096, %rd415, %rd2095; | |
mul.wide.u32 %rd2097, %r6999, 28; | |
add.s64 %rd2098, %rd2096, %rd2097; | |
ld.global.u32 %r7000, [%rd2098]; | |
and.b32 %r7001, %r7000, 65535; | |
bfe.u32 %r7002, %r7000, 16, 6; | |
mul.wide.u32 %rd2099, %r7001, 1792; | |
add.s64 %rd2100, %rd414, %rd2099; | |
mul.wide.u32 %rd2101, %r7002, 28; | |
add.s64 %rd2102, %rd2100, %rd2101; | |
ld.global.u32 %r7003, [%rd2102]; | |
and.b32 %r7004, %r7003, 65535; | |
shl.b32 %r7005, %r7004, 6; | |
bfe.u32 %r7006, %r7003, 16, 6; | |
or.b32 %r1829, %r7005, %r7006; | |
st.local.u32 [%rd2+936], %r1829; | |
bfe.u32 %r7007, %r7000, 22, 6; | |
mul.wide.u32 %rd2103, %r7007, 28; | |
add.s64 %rd2104, %rd2100, %rd2103; | |
ld.global.u32 %r7008, [%rd2104]; | |
and.b32 %r7009, %r7008, 65535; | |
shl.b32 %r7010, %r7009, 6; | |
bfe.u32 %r7011, %r7008, 16, 6; | |
or.b32 %r16444, %r7010, %r7011; | |
st.local.u32 [%rd2+940], %r16444; | |
setp.le.u32 %p236, %r1829, %r16444; | |
mov.u32 %r16443, %r1829; | |
@%p236 bra BB12_468; | |
st.local.v2.u32 [%rd2+936], {%r16444, %r1829}; | |
mov.u32 %r15203, %r16444; | |
mov.u32 %r16444, %r1829; | |
mov.u32 %r16443, %r15203; | |
BB12_468: | |
mov.u32 %r1832, %r16443; | |
mov.u32 %r1831, %r16444; | |
setp.le.u32 %p237, %r16437, %r1832; | |
mov.u32 %r16439, %r1832; | |
mov.u32 %r16440, %r1831; | |
@%p237 bra BB12_470; | |
st.local.v4.u32 [%rd2+928], {%r1832, %r1831, %r16437, %r16438}; | |
mov.u32 %r15200, %r16438; | |
mov.u32 %r15202, %r16437; | |
mov.u32 %r16438, %r1831; | |
mov.u32 %r16437, %r1832; | |
mov.u32 %r16439, %r15202; | |
mov.u32 %r16440, %r15200; | |
BB12_470: | |
mov.u32 %r16429, %r16437; | |
mov.u32 %r16430, %r16438; | |
mov.u32 %r16431, %r16439; | |
mov.u32 %r16432, %r16440; | |
mul.lo.s64 %rd2105, %rd132, 1792; | |
add.s64 %rd2106, %rd4, %rd2105; | |
bfe.u32 %r7012, %r1823, 22, 6; | |
mul.wide.u32 %rd2107, %r7012, 28; | |
add.s64 %rd2108, %rd2106, %rd2107; | |
ld.global.u32 %r1837, [%rd2108+-12]; | |
and.b32 %r7013, %r1837, 65535; | |
cvt.u64.u32 %rd134, %r7013; | |
bfe.u32 %r7014, %r1837, 16, 6; | |
mul.wide.u32 %rd2109, %r7013, 1792; | |
add.s64 %rd2110, %rd415, %rd2109; | |
mul.wide.u32 %rd2111, %r7014, 28; | |
add.s64 %rd2112, %rd2110, %rd2111; | |
ld.global.u32 %r7015, [%rd2112]; | |
and.b32 %r7016, %r7015, 65535; | |
bfe.u32 %r7017, %r7015, 16, 6; | |
mul.wide.u32 %rd2113, %r7016, 1792; | |
add.s64 %rd2114, %rd414, %rd2113; | |
mul.wide.u32 %rd2115, %r7017, 28; | |
add.s64 %rd2116, %rd2114, %rd2115; | |
ld.global.u32 %r7018, [%rd2116]; | |
and.b32 %r7019, %r7018, 65535; | |
shl.b32 %r7020, %r7019, 6; | |
bfe.u32 %r7021, %r7018, 16, 6; | |
or.b32 %r1838, %r7020, %r7021; | |
st.local.u32 [%rd2+944], %r1838; | |
bfe.u32 %r7022, %r7015, 22, 6; | |
mul.wide.u32 %rd2117, %r7022, 28; | |
add.s64 %rd2118, %rd2114, %rd2117; | |
ld.global.u32 %r7023, [%rd2118]; | |
and.b32 %r7024, %r7023, 65535; | |
shl.b32 %r7025, %r7024, 6; | |
bfe.u32 %r7026, %r7023, 16, 6; | |
or.b32 %r16450, %r7025, %r7026; | |
st.local.u32 [%rd2+948], %r16450; | |
setp.le.u32 %p238, %r1838, %r16450; | |
mov.u32 %r16449, %r1838; | |
@%p238 bra BB12_472; | |
st.local.v2.u32 [%rd2+944], {%r16450, %r1838}; | |
mov.u32 %r15217, %r16450; | |
mov.u32 %r16450, %r1838; | |
mov.u32 %r16449, %r15217; | |
BB12_472: | |
mov.u32 %r16445, %r16449; | |
mov.u32 %r16446, %r16450; | |
bfe.u32 %r7027, %r1837, 22, 6; | |
mul.lo.s64 %rd2119, %rd134, 1792; | |
add.s64 %rd2120, %rd415, %rd2119; | |
mul.wide.u32 %rd2121, %r7027, 28; | |
add.s64 %rd2122, %rd2120, %rd2121; | |
ld.global.u32 %r7028, [%rd2122]; | |
and.b32 %r7029, %r7028, 65535; | |
bfe.u32 %r7030, %r7028, 16, 6; | |
mul.wide.u32 %rd2123, %r7029, 1792; | |
add.s64 %rd2124, %rd414, %rd2123; | |
mul.wide.u32 %rd2125, %r7030, 28; | |
add.s64 %rd2126, %rd2124, %rd2125; | |
ld.global.u32 %r7031, [%rd2126]; | |
and.b32 %r7032, %r7031, 65535; | |
shl.b32 %r7033, %r7032, 6; | |
bfe.u32 %r7034, %r7031, 16, 6; | |
or.b32 %r1842, %r7033, %r7034; | |
st.local.u32 [%rd2+952], %r1842; | |
bfe.u32 %r7035, %r7028, 22, 6; | |
mul.wide.u32 %rd2127, %r7035, 28; | |
add.s64 %rd2128, %rd2124, %rd2127; | |
ld.global.u32 %r7036, [%rd2128]; | |
and.b32 %r7037, %r7036, 65535; | |
shl.b32 %r7038, %r7037, 6; | |
bfe.u32 %r7039, %r7036, 16, 6; | |
or.b32 %r16452, %r7038, %r7039; | |
st.local.u32 [%rd2+956], %r16452; | |
setp.le.u32 %p239, %r1842, %r16452; | |
mov.u32 %r16451, %r1842; | |
@%p239 bra BB12_474; | |
st.local.v2.u32 [%rd2+952], {%r16452, %r1842}; | |
mov.u32 %r15223, %r16452; | |
mov.u32 %r16452, %r1842; | |
mov.u32 %r16451, %r15223; | |
BB12_474: | |
mov.u32 %r1845, %r16451; | |
mov.u32 %r1844, %r16452; | |
setp.le.u32 %p240, %r16445, %r1845; | |
mov.u32 %r16447, %r1845; | |
mov.u32 %r16448, %r1844; | |
@%p240 bra BB12_476; | |
st.local.v4.u32 [%rd2+944], {%r1845, %r1844, %r16445, %r16446}; | |
mov.u32 %r15220, %r16446; | |
mov.u32 %r15222, %r16445; | |
mov.u32 %r16446, %r1844; | |
mov.u32 %r16445, %r1845; | |
mov.u32 %r16447, %r15222; | |
mov.u32 %r16448, %r15220; | |
BB12_476: | |
mov.u32 %r1849, %r16445; | |
mov.u32 %r1848, %r16446; | |
mov.u32 %r1847, %r16447; | |
mov.u32 %r1846, %r16448; | |
setp.le.u32 %p241, %r16429, %r1849; | |
mov.u32 %r16433, %r1849; | |
mov.u32 %r16434, %r1848; | |
mov.u32 %r16435, %r1847; | |
mov.u32 %r16436, %r1846; | |
@%p241 bra BB12_478; | |
st.local.v4.u32 [%rd2+928], {%r1849, %r1848, %r1847, %r1846}; | |
st.local.v4.u32 [%rd2+944], {%r16429, %r16430, %r16431, %r16432}; | |
mov.u32 %r15210, %r16432; | |
mov.u32 %r15212, %r16431; | |
mov.u32 %r15214, %r16430; | |
mov.u32 %r15216, %r16429; | |
mov.u32 %r16432, %r1846; | |
mov.u32 %r16431, %r1847; | |
mov.u32 %r16430, %r1848; | |
mov.u32 %r16429, %r1849; | |
mov.u32 %r16433, %r15216; | |
mov.u32 %r16434, %r15214; | |
mov.u32 %r16435, %r15212; | |
mov.u32 %r16436, %r15210; | |
BB12_478: | |
mov.u32 %r1857, %r16429; | |
mov.u32 %r1856, %r16430; | |
mov.u32 %r1855, %r16431; | |
mov.u32 %r1854, %r16432; | |
mov.u32 %r1853, %r16433; | |
mov.u32 %r1852, %r16434; | |
mov.u32 %r1851, %r16435; | |
mov.u32 %r1850, %r16436; | |
setp.le.u32 %p242, %r16389, %r1857; | |
mov.u32 %r16397, %r1857; | |
mov.u32 %r16398, %r1856; | |
mov.u32 %r16399, %r1855; | |
mov.u32 %r16400, %r1854; | |
mov.u32 %r16401, %r1853; | |
mov.u32 %r16402, %r1852; | |
mov.u32 %r16403, %r1851; | |
mov.u32 %r16404, %r1850; | |
@%p242 bra BB12_480; | |
st.local.v4.u32 [%rd2+896], {%r1857, %r1856, %r1855, %r1854}; | |
st.local.v4.u32 [%rd2+928], {%r16389, %r16390, %r16391, %r16392}; | |
st.local.v4.u32 [%rd2+912], {%r1853, %r1852, %r1851, %r1850}; | |
st.local.v4.u32 [%rd2+944], {%r16393, %r16394, %r16395, %r16396}; | |
mov.u32 %r15182, %r16396; | |
mov.u32 %r15184, %r16395; | |
mov.u32 %r15186, %r16394; | |
mov.u32 %r15188, %r16393; | |
mov.u32 %r15190, %r16392; | |
mov.u32 %r15192, %r16391; | |
mov.u32 %r15194, %r16390; | |
mov.u32 %r15196, %r16389; | |
mov.u32 %r16396, %r1850; | |
mov.u32 %r16395, %r1851; | |
mov.u32 %r16394, %r1852; | |
mov.u32 %r16393, %r1853; | |
mov.u32 %r16392, %r1854; | |
mov.u32 %r16391, %r1855; | |
mov.u32 %r16390, %r1856; | |
mov.u32 %r16389, %r1857; | |
mov.u32 %r16397, %r15196; | |
mov.u32 %r16398, %r15194; | |
mov.u32 %r16399, %r15192; | |
mov.u32 %r16400, %r15190; | |
mov.u32 %r16401, %r15188; | |
mov.u32 %r16402, %r15186; | |
mov.u32 %r16403, %r15184; | |
mov.u32 %r16404, %r15182; | |
BB12_480: | |
mov.u32 %r16357, %r16389; | |
mov.u32 %r16358, %r16390; | |
mov.u32 %r16359, %r16391; | |
mov.u32 %r16360, %r16392; | |
mov.u32 %r16361, %r16393; | |
mov.u32 %r16362, %r16394; | |
mov.u32 %r16363, %r16395; | |
mov.u32 %r16364, %r16396; | |
mov.u32 %r16365, %r16397; | |
mov.u32 %r16366, %r16398; | |
mov.u32 %r16367, %r16399; | |
mov.u32 %r16368, %r16400; | |
mov.u32 %r16369, %r16401; | |
mov.u32 %r16370, %r16402; | |
mov.u32 %r16371, %r16403; | |
mov.u32 %r16372, %r16404; | |
mul.lo.s64 %rd2129, %rd127, 1792; | |
add.s64 %rd2130, %rd4, %rd2129; | |
bfe.u32 %r7040, %r1786, 22, 6; | |
mul.wide.u32 %rd2131, %r7040, 28; | |
add.s64 %rd2132, %rd2130, %rd2131; | |
ld.global.u32 %r1874, [%rd2132+-8]; | |
and.b32 %r7041, %r1874, 65535; | |
mul.wide.u32 %rd2133, %r7041, 1792; | |
add.s64 %rd2134, %rd6, %rd2133; | |
bfe.u32 %r7042, %r1874, 16, 6; | |
mul.wide.u32 %rd2135, %r7042, 28; | |
add.s64 %rd2136, %rd2134, %rd2135; | |
ld.global.u32 %r1875, [%rd2136+-8]; | |
and.b32 %r7043, %r1875, 65535; | |
mul.wide.u32 %rd2137, %r7043, 1792; | |
add.s64 %rd2138, %rd4, %rd2137; | |
cvt.u64.u32 %rd135, %r7041; | |
cvt.u64.u32 %rd136, %r7043; | |
bfe.u32 %r7044, %r1875, 16, 6; | |
mul.wide.u32 %rd2139, %r7044, 28; | |
add.s64 %rd2140, %rd2138, %rd2139; | |
ld.global.u32 %r1876, [%rd2140+-12]; | |
and.b32 %r7045, %r1876, 65535; | |
cvt.u64.u32 %rd137, %r7045; | |
bfe.u32 %r7046, %r1876, 16, 6; | |
mul.wide.u32 %rd2141, %r7045, 1792; | |
add.s64 %rd2142, %rd415, %rd2141; | |
mul.wide.u32 %rd2143, %r7046, 28; | |
add.s64 %rd2144, %rd2142, %rd2143; | |
ld.global.u32 %r7047, [%rd2144]; | |
and.b32 %r7048, %r7047, 65535; | |
bfe.u32 %r7049, %r7047, 16, 6; | |
mul.wide.u32 %rd2145, %r7048, 1792; | |
add.s64 %rd2146, %rd414, %rd2145; | |
mul.wide.u32 %rd2147, %r7049, 28; | |
add.s64 %rd2148, %rd2146, %rd2147; | |
ld.global.u32 %r7050, [%rd2148]; | |
and.b32 %r7051, %r7050, 65535; | |
shl.b32 %r7052, %r7051, 6; | |
bfe.u32 %r7053, %r7050, 16, 6; | |
or.b32 %r1877, %r7052, %r7053; | |
st.local.u32 [%rd2+960], %r1877; | |
bfe.u32 %r7054, %r7047, 22, 6; | |
mul.wide.u32 %rd2149, %r7054, 28; | |
add.s64 %rd2150, %rd2146, %rd2149; | |
ld.global.u32 %r7055, [%rd2150]; | |
and.b32 %r7056, %r7055, 65535; | |
shl.b32 %r7057, %r7056, 6; | |
bfe.u32 %r7058, %r7055, 16, 6; | |
or.b32 %r16482, %r7057, %r7058; | |
st.local.u32 [%rd2+964], %r16482; | |
setp.le.u32 %p243, %r1877, %r16482; | |
mov.u32 %r16481, %r1877; | |
@%p243 bra BB12_482; | |
st.local.v2.u32 [%rd2+960], {%r16482, %r1877}; | |
mov.u32 %r15285, %r16482; | |
mov.u32 %r16482, %r1877; | |
mov.u32 %r16481, %r15285; | |
BB12_482: | |
mov.u32 %r16477, %r16481; | |
mov.u32 %r16478, %r16482; | |
bfe.u32 %r7059, %r1876, 22, 6; | |
mul.lo.s64 %rd2151, %rd137, 1792; | |
add.s64 %rd2152, %rd415, %rd2151; | |
mul.wide.u32 %rd2153, %r7059, 28; | |
add.s64 %rd2154, %rd2152, %rd2153; | |
ld.global.u32 %r7060, [%rd2154]; | |
and.b32 %r7061, %r7060, 65535; | |
bfe.u32 %r7062, %r7060, 16, 6; | |
mul.wide.u32 %rd2155, %r7061, 1792; | |
add.s64 %rd2156, %rd414, %rd2155; | |
mul.wide.u32 %rd2157, %r7062, 28; | |
add.s64 %rd2158, %rd2156, %rd2157; | |
ld.global.u32 %r7063, [%rd2158]; | |
and.b32 %r7064, %r7063, 65535; | |
shl.b32 %r7065, %r7064, 6; | |
bfe.u32 %r7066, %r7063, 16, 6; | |
or.b32 %r1881, %r7065, %r7066; | |
st.local.u32 [%rd2+968], %r1881; | |
bfe.u32 %r7067, %r7060, 22, 6; | |
mul.wide.u32 %rd2159, %r7067, 28; | |
add.s64 %rd2160, %rd2156, %rd2159; | |
ld.global.u32 %r7068, [%rd2160]; | |
and.b32 %r7069, %r7068, 65535; | |
shl.b32 %r7070, %r7069, 6; | |
bfe.u32 %r7071, %r7068, 16, 6; | |
or.b32 %r16484, %r7070, %r7071; | |
st.local.u32 [%rd2+972], %r16484; | |
setp.le.u32 %p244, %r1881, %r16484; | |
mov.u32 %r16483, %r1881; | |
@%p244 bra BB12_484; | |
st.local.v2.u32 [%rd2+968], {%r16484, %r1881}; | |
mov.u32 %r15291, %r16484; | |
mov.u32 %r16484, %r1881; | |
mov.u32 %r16483, %r15291; | |
BB12_484: | |
mov.u32 %r1884, %r16483; | |
mov.u32 %r1883, %r16484; | |
setp.le.u32 %p245, %r16477, %r1884; | |
mov.u32 %r16479, %r1884; | |
mov.u32 %r16480, %r1883; | |
@%p245 bra BB12_486; | |
st.local.v4.u32 [%rd2+960], {%r1884, %r1883, %r16477, %r16478}; | |
mov.u32 %r15288, %r16478; | |
mov.u32 %r15290, %r16477; | |
mov.u32 %r16478, %r1883; | |
mov.u32 %r16477, %r1884; | |
mov.u32 %r16479, %r15290; | |
mov.u32 %r16480, %r15288; | |
BB12_486: | |
mov.u32 %r16469, %r16477; | |
mov.u32 %r16470, %r16478; | |
mov.u32 %r16471, %r16479; | |
mov.u32 %r16472, %r16480; | |
mul.lo.s64 %rd2161, %rd136, 1792; | |
add.s64 %rd2162, %rd4, %rd2161; | |
bfe.u32 %r7072, %r1875, 22, 6; | |
mul.wide.u32 %rd2163, %r7072, 28; | |
add.s64 %rd2164, %rd2162, %rd2163; | |
ld.global.u32 %r1889, [%rd2164+-12]; | |
and.b32 %r7073, %r1889, 65535; | |
cvt.u64.u32 %rd138, %r7073; | |
bfe.u32 %r7074, %r1889, 16, 6; | |
mul.wide.u32 %rd2165, %r7073, 1792; | |
add.s64 %rd2166, %rd415, %rd2165; | |
mul.wide.u32 %rd2167, %r7074, 28; | |
add.s64 %rd2168, %rd2166, %rd2167; | |
ld.global.u32 %r7075, [%rd2168]; | |
and.b32 %r7076, %r7075, 65535; | |
bfe.u32 %r7077, %r7075, 16, 6; | |
mul.wide.u32 %rd2169, %r7076, 1792; | |
add.s64 %rd2170, %rd414, %rd2169; | |
mul.wide.u32 %rd2171, %r7077, 28; | |
add.s64 %rd2172, %rd2170, %rd2171; | |
ld.global.u32 %r7078, [%rd2172]; | |
and.b32 %r7079, %r7078, 65535; | |
shl.b32 %r7080, %r7079, 6; | |
bfe.u32 %r7081, %r7078, 16, 6; | |
or.b32 %r1890, %r7080, %r7081; | |
st.local.u32 [%rd2+976], %r1890; | |
bfe.u32 %r7082, %r7075, 22, 6; | |
mul.wide.u32 %rd2173, %r7082, 28; | |
add.s64 %rd2174, %rd2170, %rd2173; | |
ld.global.u32 %r7083, [%rd2174]; | |
and.b32 %r7084, %r7083, 65535; | |
shl.b32 %r7085, %r7084, 6; | |
bfe.u32 %r7086, %r7083, 16, 6; | |
or.b32 %r16490, %r7085, %r7086; | |
st.local.u32 [%rd2+980], %r16490; | |
setp.le.u32 %p246, %r1890, %r16490; | |
mov.u32 %r16489, %r1890; | |
@%p246 bra BB12_488; | |
st.local.v2.u32 [%rd2+976], {%r16490, %r1890}; | |
mov.u32 %r15305, %r16490; | |
mov.u32 %r16490, %r1890; | |
mov.u32 %r16489, %r15305; | |
BB12_488: | |
mov.u32 %r16485, %r16489; | |
mov.u32 %r16486, %r16490; | |
bfe.u32 %r7087, %r1889, 22, 6; | |
mul.lo.s64 %rd2175, %rd138, 1792; | |
add.s64 %rd2176, %rd415, %rd2175; | |
mul.wide.u32 %rd2177, %r7087, 28; | |
add.s64 %rd2178, %rd2176, %rd2177; | |
ld.global.u32 %r7088, [%rd2178]; | |
and.b32 %r7089, %r7088, 65535; | |
bfe.u32 %r7090, %r7088, 16, 6; | |
mul.wide.u32 %rd2179, %r7089, 1792; | |
add.s64 %rd2180, %rd414, %rd2179; | |
mul.wide.u32 %rd2181, %r7090, 28; | |
add.s64 %rd2182, %rd2180, %rd2181; | |
ld.global.u32 %r7091, [%rd2182]; | |
and.b32 %r7092, %r7091, 65535; | |
shl.b32 %r7093, %r7092, 6; | |
bfe.u32 %r7094, %r7091, 16, 6; | |
or.b32 %r1894, %r7093, %r7094; | |
st.local.u32 [%rd2+984], %r1894; | |
bfe.u32 %r7095, %r7088, 22, 6; | |
mul.wide.u32 %rd2183, %r7095, 28; | |
add.s64 %rd2184, %rd2180, %rd2183; | |
ld.global.u32 %r7096, [%rd2184]; | |
and.b32 %r7097, %r7096, 65535; | |
shl.b32 %r7098, %r7097, 6; | |
bfe.u32 %r7099, %r7096, 16, 6; | |
or.b32 %r16492, %r7098, %r7099; | |
st.local.u32 [%rd2+988], %r16492; | |
setp.le.u32 %p247, %r1894, %r16492; | |
mov.u32 %r16491, %r1894; | |
@%p247 bra BB12_490; | |
st.local.v2.u32 [%rd2+984], {%r16492, %r1894}; | |
mov.u32 %r15311, %r16492; | |
mov.u32 %r16492, %r1894; | |
mov.u32 %r16491, %r15311; | |
BB12_490: | |
mov.u32 %r1897, %r16491; | |
mov.u32 %r1896, %r16492; | |
setp.le.u32 %p248, %r16485, %r1897; | |
mov.u32 %r16487, %r1897; | |
mov.u32 %r16488, %r1896; | |
@%p248 bra BB12_492; | |
st.local.v4.u32 [%rd2+976], {%r1897, %r1896, %r16485, %r16486}; | |
mov.u32 %r15308, %r16486; | |
mov.u32 %r15310, %r16485; | |
mov.u32 %r16486, %r1896; | |
mov.u32 %r16485, %r1897; | |
mov.u32 %r16487, %r15310; | |
mov.u32 %r16488, %r15308; | |
BB12_492: | |
mov.u32 %r1901, %r16485; | |
mov.u32 %r1900, %r16486; | |
mov.u32 %r1899, %r16487; | |
mov.u32 %r1898, %r16488; | |
setp.le.u32 %p249, %r16469, %r1901; | |
mov.u32 %r16473, %r1901; | |
mov.u32 %r16474, %r1900; | |
mov.u32 %r16475, %r1899; | |
mov.u32 %r16476, %r1898; | |
@%p249 bra BB12_494; | |
st.local.v4.u32 [%rd2+960], {%r1901, %r1900, %r1899, %r1898}; | |
st.local.v4.u32 [%rd2+976], {%r16469, %r16470, %r16471, %r16472}; | |
mov.u32 %r15298, %r16472; | |
mov.u32 %r15300, %r16471; | |
mov.u32 %r15302, %r16470; | |
mov.u32 %r15304, %r16469; | |
mov.u32 %r16472, %r1898; | |
mov.u32 %r16471, %r1899; | |
mov.u32 %r16470, %r1900; | |
mov.u32 %r16469, %r1901; | |
mov.u32 %r16473, %r15304; | |
mov.u32 %r16474, %r15302; | |
mov.u32 %r16475, %r15300; | |
mov.u32 %r16476, %r15298; | |
BB12_494: | |
mov.u32 %r16453, %r16469; | |
mov.u32 %r16454, %r16470; | |
mov.u32 %r16455, %r16471; | |
mov.u32 %r16456, %r16472; | |
mov.u32 %r16457, %r16473; | |
mov.u32 %r16458, %r16474; | |
mov.u32 %r16459, %r16475; | |
mov.u32 %r16460, %r16476; | |
mul.lo.s64 %rd2185, %rd135, 1792; | |
add.s64 %rd2186, %rd6, %rd2185; | |
bfe.u32 %r7100, %r1874, 22, 6; | |
mul.wide.u32 %rd2187, %r7100, 28; | |
add.s64 %rd2188, %rd2186, %rd2187; | |
ld.global.u32 %r1910, [%rd2188+-8]; | |
and.b32 %r7101, %r1910, 65535; | |
mul.wide.u32 %rd2189, %r7101, 1792; | |
add.s64 %rd2190, %rd4, %rd2189; | |
cvt.u64.u32 %rd139, %r7101; | |
bfe.u32 %r7102, %r1910, 16, 6; | |
mul.wide.u32 %rd2191, %r7102, 28; | |
add.s64 %rd2192, %rd2190, %rd2191; | |
ld.global.u32 %r1911, [%rd2192+-12]; | |
and.b32 %r7103, %r1911, 65535; | |
cvt.u64.u32 %rd140, %r7103; | |
bfe.u32 %r7104, %r1911, 16, 6; | |
mul.wide.u32 %rd2193, %r7103, 1792; | |
add.s64 %rd2194, %rd415, %rd2193; | |
mul.wide.u32 %rd2195, %r7104, 28; | |
add.s64 %rd2196, %rd2194, %rd2195; | |
ld.global.u32 %r7105, [%rd2196]; | |
and.b32 %r7106, %r7105, 65535; | |
bfe.u32 %r7107, %r7105, 16, 6; | |
mul.wide.u32 %rd2197, %r7106, 1792; | |
add.s64 %rd2198, %rd414, %rd2197; | |
mul.wide.u32 %rd2199, %r7107, 28; | |
add.s64 %rd2200, %rd2198, %rd2199; | |
ld.global.u32 %r7108, [%rd2200]; | |
and.b32 %r7109, %r7108, 65535; | |
shl.b32 %r7110, %r7109, 6; | |
bfe.u32 %r7111, %r7108, 16, 6; | |
or.b32 %r1912, %r7110, %r7111; | |
st.local.u32 [%rd2+992], %r1912; | |
bfe.u32 %r7112, %r7105, 22, 6; | |
mul.wide.u32 %rd2201, %r7112, 28; | |
add.s64 %rd2202, %rd2198, %rd2201; | |
ld.global.u32 %r7113, [%rd2202]; | |
and.b32 %r7114, %r7113, 65535; | |
shl.b32 %r7115, %r7114, 6; | |
bfe.u32 %r7116, %r7113, 16, 6; | |
or.b32 %r16506, %r7115, %r7116; | |
st.local.u32 [%rd2+996], %r16506; | |
setp.le.u32 %p250, %r1912, %r16506; | |
mov.u32 %r16505, %r1912; | |
@%p250 bra BB12_496; | |
st.local.v2.u32 [%rd2+992], {%r16506, %r1912}; | |
mov.u32 %r15341, %r16506; | |
mov.u32 %r16506, %r1912; | |
mov.u32 %r16505, %r15341; | |
BB12_496: | |
mov.u32 %r16501, %r16505; | |
mov.u32 %r16502, %r16506; | |
bfe.u32 %r7117, %r1911, 22, 6; | |
mul.lo.s64 %rd2203, %rd140, 1792; | |
add.s64 %rd2204, %rd415, %rd2203; | |
mul.wide.u32 %rd2205, %r7117, 28; | |
add.s64 %rd2206, %rd2204, %rd2205; | |
ld.global.u32 %r7118, [%rd2206]; | |
and.b32 %r7119, %r7118, 65535; | |
bfe.u32 %r7120, %r7118, 16, 6; | |
mul.wide.u32 %rd2207, %r7119, 1792; | |
add.s64 %rd2208, %rd414, %rd2207; | |
mul.wide.u32 %rd2209, %r7120, 28; | |
add.s64 %rd2210, %rd2208, %rd2209; | |
ld.global.u32 %r7121, [%rd2210]; | |
and.b32 %r7122, %r7121, 65535; | |
shl.b32 %r7123, %r7122, 6; | |
bfe.u32 %r7124, %r7121, 16, 6; | |
or.b32 %r1916, %r7123, %r7124; | |
st.local.u32 [%rd2+1000], %r1916; | |
bfe.u32 %r7125, %r7118, 22, 6; | |
mul.wide.u32 %rd2211, %r7125, 28; | |
add.s64 %rd2212, %rd2208, %rd2211; | |
ld.global.u32 %r7126, [%rd2212]; | |
and.b32 %r7127, %r7126, 65535; | |
shl.b32 %r7128, %r7127, 6; | |
bfe.u32 %r7129, %r7126, 16, 6; | |
or.b32 %r16508, %r7128, %r7129; | |
st.local.u32 [%rd2+1004], %r16508; | |
setp.le.u32 %p251, %r1916, %r16508; | |
mov.u32 %r16507, %r1916; | |
@%p251 bra BB12_498; | |
st.local.v2.u32 [%rd2+1000], {%r16508, %r1916}; | |
mov.u32 %r15347, %r16508; | |
mov.u32 %r16508, %r1916; | |
mov.u32 %r16507, %r15347; | |
BB12_498: | |
mov.u32 %r1919, %r16507; | |
mov.u32 %r1918, %r16508; | |
setp.le.u32 %p252, %r16501, %r1919; | |
mov.u32 %r16503, %r1919; | |
mov.u32 %r16504, %r1918; | |
@%p252 bra BB12_500; | |
st.local.v4.u32 [%rd2+992], {%r1919, %r1918, %r16501, %r16502}; | |
mov.u32 %r15344, %r16502; | |
mov.u32 %r15346, %r16501; | |
mov.u32 %r16502, %r1918; | |
mov.u32 %r16501, %r1919; | |
mov.u32 %r16503, %r15346; | |
mov.u32 %r16504, %r15344; | |
BB12_500: | |
mov.u32 %r16493, %r16501; | |
mov.u32 %r16494, %r16502; | |
mov.u32 %r16495, %r16503; | |
mov.u32 %r16496, %r16504; | |
mul.lo.s64 %rd2213, %rd139, 1792; | |
add.s64 %rd2214, %rd4, %rd2213; | |
bfe.u32 %r7130, %r1910, 22, 6; | |
mul.wide.u32 %rd2215, %r7130, 28; | |
add.s64 %rd2216, %rd2214, %rd2215; | |
ld.global.u32 %r1924, [%rd2216+-12]; | |
and.b32 %r7131, %r1924, 65535; | |
cvt.u64.u32 %rd141, %r7131; | |
bfe.u32 %r7132, %r1924, 16, 6; | |
mul.wide.u32 %rd2217, %r7131, 1792; | |
add.s64 %rd2218, %rd415, %rd2217; | |
mul.wide.u32 %rd2219, %r7132, 28; | |
add.s64 %rd2220, %rd2218, %rd2219; | |
ld.global.u32 %r7133, [%rd2220]; | |
and.b32 %r7134, %r7133, 65535; | |
bfe.u32 %r7135, %r7133, 16, 6; | |
mul.wide.u32 %rd2221, %r7134, 1792; | |
add.s64 %rd2222, %rd414, %rd2221; | |
mul.wide.u32 %rd2223, %r7135, 28; | |
add.s64 %rd2224, %rd2222, %rd2223; | |
ld.global.u32 %r7136, [%rd2224]; | |
and.b32 %r7137, %r7136, 65535; | |
shl.b32 %r7138, %r7137, 6; | |
bfe.u32 %r7139, %r7136, 16, 6; | |
or.b32 %r1925, %r7138, %r7139; | |
st.local.u32 [%rd2+1008], %r1925; | |
bfe.u32 %r7140, %r7133, 22, 6; | |
mul.wide.u32 %rd2225, %r7140, 28; | |
add.s64 %rd2226, %rd2222, %rd2225; | |
ld.global.u32 %r7141, [%rd2226]; | |
and.b32 %r7142, %r7141, 65535; | |
shl.b32 %r7143, %r7142, 6; | |
bfe.u32 %r7144, %r7141, 16, 6; | |
or.b32 %r16514, %r7143, %r7144; | |
st.local.u32 [%rd2+1012], %r16514; | |
setp.le.u32 %p253, %r1925, %r16514; | |
mov.u32 %r16513, %r1925; | |
@%p253 bra BB12_502; | |
st.local.v2.u32 [%rd2+1008], {%r16514, %r1925}; | |
mov.u32 %r15361, %r16514; | |
mov.u32 %r16514, %r1925; | |
mov.u32 %r16513, %r15361; | |
BB12_502: | |
mov.u32 %r16509, %r16513; | |
mov.u32 %r16510, %r16514; | |
bfe.u32 %r7145, %r1924, 22, 6; | |
mul.lo.s64 %rd2227, %rd141, 1792; | |
add.s64 %rd2228, %rd415, %rd2227; | |
mul.wide.u32 %rd2229, %r7145, 28; | |
add.s64 %rd2230, %rd2228, %rd2229; | |
ld.global.u32 %r7146, [%rd2230]; | |
and.b32 %r7147, %r7146, 65535; | |
bfe.u32 %r7148, %r7146, 16, 6; | |
mul.wide.u32 %rd2231, %r7147, 1792; | |
add.s64 %rd2232, %rd414, %rd2231; | |
mul.wide.u32 %rd2233, %r7148, 28; | |
add.s64 %rd2234, %rd2232, %rd2233; | |
ld.global.u32 %r7149, [%rd2234]; | |
and.b32 %r7150, %r7149, 65535; | |
shl.b32 %r7151, %r7150, 6; | |
bfe.u32 %r7152, %r7149, 16, 6; | |
or.b32 %r1929, %r7151, %r7152; | |
st.local.u32 [%rd2+1016], %r1929; | |
bfe.u32 %r7153, %r7146, 22, 6; | |
mul.wide.u32 %rd2235, %r7153, 28; | |
add.s64 %rd2236, %rd2232, %rd2235; | |
ld.global.u32 %r7154, [%rd2236]; | |
and.b32 %r7155, %r7154, 65535; | |
shl.b32 %r7156, %r7155, 6; | |
bfe.u32 %r7157, %r7154, 16, 6; | |
or.b32 %r16516, %r7156, %r7157; | |
st.local.u32 [%rd2+1020], %r16516; | |
setp.le.u32 %p254, %r1929, %r16516; | |
mov.u32 %r16515, %r1929; | |
@%p254 bra BB12_504; | |
st.local.v2.u32 [%rd2+1016], {%r16516, %r1929}; | |
mov.u32 %r15367, %r16516; | |
mov.u32 %r16516, %r1929; | |
mov.u32 %r16515, %r15367; | |
BB12_504: | |
mov.u32 %r1932, %r16515; | |
mov.u32 %r1931, %r16516; | |
setp.le.u32 %p255, %r16509, %r1932; | |
mov.u32 %r16511, %r1932; | |
mov.u32 %r16512, %r1931; | |
@%p255 bra BB12_506; | |
st.local.v4.u32 [%rd2+1008], {%r1932, %r1931, %r16509, %r16510}; | |
mov.u32 %r15364, %r16510; | |
mov.u32 %r15366, %r16509; | |
mov.u32 %r16510, %r1931; | |
mov.u32 %r16509, %r1932; | |
mov.u32 %r16511, %r15366; | |
mov.u32 %r16512, %r15364; | |
BB12_506: | |
mov.u32 %r1936, %r16509; | |
mov.u32 %r1935, %r16510; | |
mov.u32 %r1934, %r16511; | |
mov.u32 %r1933, %r16512; | |
setp.le.u32 %p256, %r16493, %r1936; | |
mov.u32 %r16497, %r1936; | |
mov.u32 %r16498, %r1935; | |
mov.u32 %r16499, %r1934; | |
mov.u32 %r16500, %r1933; | |
@%p256 bra BB12_508; | |
st.local.v4.u32 [%rd2+992], {%r1936, %r1935, %r1934, %r1933}; | |
st.local.v4.u32 [%rd2+1008], {%r16493, %r16494, %r16495, %r16496}; | |
mov.u32 %r15354, %r16496; | |
mov.u32 %r15356, %r16495; | |
mov.u32 %r15358, %r16494; | |
mov.u32 %r15360, %r16493; | |
mov.u32 %r16496, %r1933; | |
mov.u32 %r16495, %r1934; | |
mov.u32 %r16494, %r1935; | |
mov.u32 %r16493, %r1936; | |
mov.u32 %r16497, %r15360; | |
mov.u32 %r16498, %r15358; | |
mov.u32 %r16499, %r15356; | |
mov.u32 %r16500, %r15354; | |
BB12_508: | |
mov.u32 %r1944, %r16493; | |
mov.u32 %r1943, %r16494; | |
mov.u32 %r1942, %r16495; | |
mov.u32 %r1941, %r16496; | |
mov.u32 %r1940, %r16497; | |
mov.u32 %r1939, %r16498; | |
mov.u32 %r1938, %r16499; | |
mov.u32 %r1937, %r16500; | |
setp.le.u32 %p257, %r16453, %r1944; | |
mov.u32 %r16461, %r1944; | |
mov.u32 %r16462, %r1943; | |
mov.u32 %r16463, %r1942; | |
mov.u32 %r16464, %r1941; | |
mov.u32 %r16465, %r1940; | |
mov.u32 %r16466, %r1939; | |
mov.u32 %r16467, %r1938; | |
mov.u32 %r16468, %r1937; | |
@%p257 bra BB12_510; | |
st.local.v4.u32 [%rd2+960], {%r1944, %r1943, %r1942, %r1941}; | |
st.local.v4.u32 [%rd2+992], {%r16453, %r16454, %r16455, %r16456}; | |
st.local.v4.u32 [%rd2+976], {%r1940, %r1939, %r1938, %r1937}; | |
st.local.v4.u32 [%rd2+1008], {%r16457, %r16458, %r16459, %r16460}; | |
mov.u32 %r15326, %r16460; | |
mov.u32 %r15328, %r16459; | |
mov.u32 %r15330, %r16458; | |
mov.u32 %r15332, %r16457; | |
mov.u32 %r15334, %r16456; | |
mov.u32 %r15336, %r16455; | |
mov.u32 %r15338, %r16454; | |
mov.u32 %r15340, %r16453; | |
mov.u32 %r16460, %r1937; | |
mov.u32 %r16459, %r1938; | |
mov.u32 %r16458, %r1939; | |
mov.u32 %r16457, %r1940; | |
mov.u32 %r16456, %r1941; | |
mov.u32 %r16455, %r1942; | |
mov.u32 %r16454, %r1943; | |
mov.u32 %r16453, %r1944; | |
mov.u32 %r16461, %r15340; | |
mov.u32 %r16462, %r15338; | |
mov.u32 %r16463, %r15336; | |
mov.u32 %r16464, %r15334; | |
mov.u32 %r16465, %r15332; | |
mov.u32 %r16466, %r15330; | |
mov.u32 %r16467, %r15328; | |
mov.u32 %r16468, %r15326; | |
BB12_510: | |
mov.u32 %r1960, %r16453; | |
mov.u32 %r1959, %r16454; | |
mov.u32 %r1958, %r16455; | |
mov.u32 %r1957, %r16456; | |
mov.u32 %r1956, %r16457; | |
mov.u32 %r1955, %r16458; | |
mov.u32 %r1954, %r16459; | |
mov.u32 %r1953, %r16460; | |
mov.u32 %r1952, %r16461; | |
mov.u32 %r1951, %r16462; | |
mov.u32 %r1950, %r16463; | |
mov.u32 %r1949, %r16464; | |
mov.u32 %r1948, %r16465; | |
mov.u32 %r1947, %r16466; | |
mov.u32 %r1946, %r16467; | |
mov.u32 %r1945, %r16468; | |
setp.le.u32 %p258, %r16357, %r1960; | |
mov.u32 %r16373, %r1960; | |
mov.u32 %r16374, %r1959; | |
mov.u32 %r16375, %r1958; | |
mov.u32 %r16376, %r1957; | |
mov.u32 %r16377, %r1956; | |
mov.u32 %r16378, %r1955; | |
mov.u32 %r16379, %r1954; | |
mov.u32 %r16380, %r1953; | |
mov.u32 %r16381, %r1952; | |
mov.u32 %r16382, %r1951; | |
mov.u32 %r16383, %r1950; | |
mov.u32 %r16384, %r1949; | |
mov.u32 %r16385, %r1948; | |
mov.u32 %r16386, %r1947; | |
mov.u32 %r16387, %r1946; | |
mov.u32 %r16388, %r1945; | |
@%p258 bra BB12_512; | |
st.local.v4.u32 [%rd2+896], {%r1960, %r1959, %r1958, %r1957}; | |
st.local.v4.u32 [%rd2+960], {%r16357, %r16358, %r16359, %r16360}; | |
st.local.v4.u32 [%rd2+912], {%r1956, %r1955, %r1954, %r1953}; | |
st.local.v4.u32 [%rd2+976], {%r16361, %r16362, %r16363, %r16364}; | |
st.local.v4.u32 [%rd2+928], {%r1952, %r1951, %r1950, %r1949}; | |
st.local.v4.u32 [%rd2+992], {%r16365, %r16366, %r16367, %r16368}; | |
st.local.v4.u32 [%rd2+944], {%r1948, %r1947, %r1946, %r1945}; | |
st.local.v4.u32 [%rd2+1008], {%r16369, %r16370, %r16371, %r16372}; | |
mov.u32 %r15254, %r16372; | |
mov.u32 %r15256, %r16371; | |
mov.u32 %r15258, %r16370; | |
mov.u32 %r15260, %r16369; | |
mov.u32 %r15262, %r16368; | |
mov.u32 %r15264, %r16367; | |
mov.u32 %r15266, %r16366; | |
mov.u32 %r15268, %r16365; | |
mov.u32 %r15270, %r16364; | |
mov.u32 %r15272, %r16363; | |
mov.u32 %r15274, %r16362; | |
mov.u32 %r15276, %r16361; | |
mov.u32 %r15278, %r16360; | |
mov.u32 %r15280, %r16359; | |
mov.u32 %r15282, %r16358; | |
mov.u32 %r15284, %r16357; | |
mov.u32 %r16372, %r1945; | |
mov.u32 %r16371, %r1946; | |
mov.u32 %r16370, %r1947; | |
mov.u32 %r16369, %r1948; | |
mov.u32 %r16368, %r1949; | |
mov.u32 %r16367, %r1950; | |
mov.u32 %r16366, %r1951; | |
mov.u32 %r16365, %r1952; | |
mov.u32 %r16364, %r1953; | |
mov.u32 %r16363, %r1954; | |
mov.u32 %r16362, %r1955; | |
mov.u32 %r16361, %r1956; | |
mov.u32 %r16360, %r1957; | |
mov.u32 %r16359, %r1958; | |
mov.u32 %r16358, %r1959; | |
mov.u32 %r16357, %r1960; | |
mov.u32 %r16373, %r15284; | |
mov.u32 %r16374, %r15282; | |
mov.u32 %r16375, %r15280; | |
mov.u32 %r16376, %r15278; | |
mov.u32 %r16377, %r15276; | |
mov.u32 %r16378, %r15274; | |
mov.u32 %r16379, %r15272; | |
mov.u32 %r16380, %r15270; | |
mov.u32 %r16381, %r15268; | |
mov.u32 %r16382, %r15266; | |
mov.u32 %r16383, %r15264; | |
mov.u32 %r16384, %r15262; | |
mov.u32 %r16385, %r15260; | |
mov.u32 %r16386, %r15258; | |
mov.u32 %r16387, %r15256; | |
mov.u32 %r16388, %r15254; | |
BB12_512: | |
mov.u32 %r1992, %r16357; | |
mov.u32 %r1991, %r16358; | |
mov.u32 %r1990, %r16359; | |
mov.u32 %r1989, %r16360; | |
mov.u32 %r1988, %r16361; | |
mov.u32 %r1987, %r16362; | |
mov.u32 %r1986, %r16363; | |
mov.u32 %r1985, %r16364; | |
mov.u32 %r1984, %r16365; | |
mov.u32 %r1983, %r16366; | |
mov.u32 %r1982, %r16367; | |
mov.u32 %r1981, %r16368; | |
mov.u32 %r1980, %r16369; | |
mov.u32 %r1979, %r16370; | |
mov.u32 %r1978, %r16371; | |
mov.u32 %r1977, %r16372; | |
mov.u32 %r1976, %r16373; | |
mov.u32 %r1975, %r16374; | |
mov.u32 %r1974, %r16375; | |
mov.u32 %r1973, %r16376; | |
mov.u32 %r1972, %r16377; | |
mov.u32 %r1971, %r16378; | |
mov.u32 %r1970, %r16379; | |
mov.u32 %r1969, %r16380; | |
mov.u32 %r1968, %r16381; | |
mov.u32 %r1967, %r16382; | |
mov.u32 %r1966, %r16383; | |
mov.u32 %r1965, %r16384; | |
mov.u32 %r1964, %r16385; | |
mov.u32 %r1963, %r16386; | |
mov.u32 %r1962, %r16387; | |
mov.u32 %r1961, %r16388; | |
setp.le.u32 %p259, %r16133, %r1992; | |
mov.u32 %r16165, %r1992; | |
mov.u32 %r16166, %r1991; | |
mov.u32 %r16167, %r1990; | |
mov.u32 %r16168, %r1989; | |
mov.u32 %r16169, %r1988; | |
mov.u32 %r16170, %r1987; | |
mov.u32 %r16171, %r1986; | |
mov.u32 %r16172, %r1985; | |
mov.u32 %r16173, %r1984; | |
mov.u32 %r16174, %r1983; | |
mov.u32 %r16175, %r1982; | |
mov.u32 %r16176, %r1981; | |
mov.u32 %r16177, %r1980; | |
mov.u32 %r16178, %r1979; | |
mov.u32 %r16179, %r1978; | |
mov.u32 %r16180, %r1977; | |
mov.u32 %r16181, %r1976; | |
mov.u32 %r16182, %r1975; | |
mov.u32 %r16183, %r1974; | |
mov.u32 %r16184, %r1973; | |
mov.u32 %r16185, %r1972; | |
mov.u32 %r16186, %r1971; | |
mov.u32 %r16187, %r1970; | |
mov.u32 %r16188, %r1969; | |
mov.u32 %r16189, %r1968; | |
mov.u32 %r16190, %r1967; | |
mov.u32 %r16191, %r1966; | |
mov.u32 %r16192, %r1965; | |
mov.u32 %r16193, %r1964; | |
mov.u32 %r16194, %r1963; | |
mov.u32 %r16195, %r1962; | |
mov.u32 %r16196, %r1961; | |
@%p259 bra BB12_514; | |
st.local.v4.u32 [%rd2+768], {%r1992, %r1991, %r1990, %r1989}; | |
st.local.v4.u32 [%rd2+896], {%r16133, %r16134, %r16135, %r16136}; | |
st.local.v4.u32 [%rd2+784], {%r1988, %r1987, %r1986, %r1985}; | |
st.local.v4.u32 [%rd2+912], {%r16137, %r16138, %r16139, %r16140}; | |
st.local.v4.u32 [%rd2+800], {%r1984, %r1983, %r1982, %r1981}; | |
st.local.v4.u32 [%rd2+928], {%r16141, %r16142, %r16143, %r16144}; | |
st.local.v4.u32 [%rd2+816], {%r1980, %r1979, %r1978, %r1977}; | |
st.local.v4.u32 [%rd2+944], {%r16145, %r16146, %r16147, %r16148}; | |
st.local.v4.u32 [%rd2+832], {%r1976, %r1975, %r1974, %r1973}; | |
st.local.v4.u32 [%rd2+960], {%r16149, %r16150, %r16151, %r16152}; | |
st.local.v4.u32 [%rd2+848], {%r1972, %r1971, %r1970, %r1969}; | |
st.local.v4.u32 [%rd2+976], {%r16153, %r16154, %r16155, %r16156}; | |
st.local.v4.u32 [%rd2+864], {%r1968, %r1967, %r1966, %r1965}; | |
st.local.v4.u32 [%rd2+992], {%r16157, %r16158, %r16159, %r16160}; | |
st.local.v4.u32 [%rd2+880], {%r1964, %r1963, %r1962, %r1961}; | |
st.local.v4.u32 [%rd2+1008], {%r16161, %r16162, %r16163, %r16164}; | |
mov.u32 %r15078, %r16164; | |
mov.u32 %r15080, %r16163; | |
mov.u32 %r15082, %r16162; | |
mov.u32 %r15084, %r16161; | |
mov.u32 %r15086, %r16160; | |
mov.u32 %r15088, %r16159; | |
mov.u32 %r15090, %r16158; | |
mov.u32 %r15092, %r16157; | |
mov.u32 %r15094, %r16156; | |
mov.u32 %r15096, %r16155; | |
mov.u32 %r15098, %r16154; | |
mov.u32 %r15100, %r16153; | |
mov.u32 %r15102, %r16152; | |
mov.u32 %r15104, %r16151; | |
mov.u32 %r15106, %r16150; | |
mov.u32 %r15108, %r16149; | |
mov.u32 %r15110, %r16148; | |
mov.u32 %r15112, %r16147; | |
mov.u32 %r15114, %r16146; | |
mov.u32 %r15116, %r16145; | |
mov.u32 %r15118, %r16144; | |
mov.u32 %r15120, %r16143; | |
mov.u32 %r15122, %r16142; | |
mov.u32 %r15124, %r16141; | |
mov.u32 %r15126, %r16140; | |
mov.u32 %r15128, %r16139; | |
mov.u32 %r15130, %r16138; | |
mov.u32 %r15132, %r16137; | |
mov.u32 %r15134, %r16136; | |
mov.u32 %r15136, %r16135; | |
mov.u32 %r15138, %r16134; | |
mov.u32 %r15140, %r16133; | |
mov.u32 %r16164, %r1961; | |
mov.u32 %r16163, %r1962; | |
mov.u32 %r16162, %r1963; | |
mov.u32 %r16161, %r1964; | |
mov.u32 %r16160, %r1965; | |
mov.u32 %r16159, %r1966; | |
mov.u32 %r16158, %r1967; | |
mov.u32 %r16157, %r1968; | |
mov.u32 %r16156, %r1969; | |
mov.u32 %r16155, %r1970; | |
mov.u32 %r16154, %r1971; | |
mov.u32 %r16153, %r1972; | |
mov.u32 %r16152, %r1973; | |
mov.u32 %r16151, %r1974; | |
mov.u32 %r16150, %r1975; | |
mov.u32 %r16149, %r1976; | |
mov.u32 %r16148, %r1977; | |
mov.u32 %r16147, %r1978; | |
mov.u32 %r16146, %r1979; | |
mov.u32 %r16145, %r1980; | |
mov.u32 %r16144, %r1981; | |
mov.u32 %r16143, %r1982; | |
mov.u32 %r16142, %r1983; | |
mov.u32 %r16141, %r1984; | |
mov.u32 %r16140, %r1985; | |
mov.u32 %r16139, %r1986; | |
mov.u32 %r16138, %r1987; | |
mov.u32 %r16137, %r1988; | |
mov.u32 %r16136, %r1989; | |
mov.u32 %r16135, %r1990; | |
mov.u32 %r16134, %r1991; | |
mov.u32 %r16133, %r1992; | |
mov.u32 %r16165, %r15140; | |
mov.u32 %r16166, %r15138; | |
mov.u32 %r16167, %r15136; | |
mov.u32 %r16168, %r15134; | |
mov.u32 %r16169, %r15132; | |
mov.u32 %r16170, %r15130; | |
mov.u32 %r16171, %r15128; | |
mov.u32 %r16172, %r15126; | |
mov.u32 %r16173, %r15124; | |
mov.u32 %r16174, %r15122; | |
mov.u32 %r16175, %r15120; | |
mov.u32 %r16176, %r15118; | |
mov.u32 %r16177, %r15116; | |
mov.u32 %r16178, %r15114; | |
mov.u32 %r16179, %r15112; | |
mov.u32 %r16180, %r15110; | |
mov.u32 %r16181, %r15108; | |
mov.u32 %r16182, %r15106; | |
mov.u32 %r16183, %r15104; | |
mov.u32 %r16184, %r15102; | |
mov.u32 %r16185, %r15100; | |
mov.u32 %r16186, %r15098; | |
mov.u32 %r16187, %r15096; | |
mov.u32 %r16188, %r15094; | |
mov.u32 %r16189, %r15092; | |
mov.u32 %r16190, %r15090; | |
mov.u32 %r16191, %r15088; | |
mov.u32 %r16192, %r15086; | |
mov.u32 %r16193, %r15084; | |
mov.u32 %r16194, %r15082; | |
mov.u32 %r16195, %r15080; | |
mov.u32 %r16196, %r15078; | |
BB12_514: | |
mov.u32 %r2056, %r16133; | |
mov.u32 %r2055, %r16134; | |
mov.u32 %r2054, %r16135; | |
mov.u32 %r2053, %r16136; | |
mov.u32 %r2052, %r16137; | |
mov.u32 %r2051, %r16138; | |
mov.u32 %r2050, %r16139; | |
mov.u32 %r2049, %r16140; | |
mov.u32 %r2048, %r16141; | |
mov.u32 %r2047, %r16142; | |
mov.u32 %r2046, %r16143; | |
mov.u32 %r2045, %r16144; | |
mov.u32 %r2044, %r16145; | |
mov.u32 %r2043, %r16146; | |
mov.u32 %r2042, %r16147; | |
mov.u32 %r2041, %r16148; | |
mov.u32 %r2040, %r16149; | |
mov.u32 %r2039, %r16150; | |
mov.u32 %r2038, %r16151; | |
mov.u32 %r2037, %r16152; | |
mov.u32 %r2036, %r16153; | |
mov.u32 %r2035, %r16154; | |
mov.u32 %r2034, %r16155; | |
mov.u32 %r2033, %r16156; | |
mov.u32 %r2032, %r16157; | |
mov.u32 %r2031, %r16158; | |
mov.u32 %r2030, %r16159; | |
mov.u32 %r2029, %r16160; | |
mov.u32 %r2028, %r16161; | |
mov.u32 %r2027, %r16162; | |
mov.u32 %r2026, %r16163; | |
mov.u32 %r2025, %r16164; | |
mov.u32 %r2024, %r16165; | |
mov.u32 %r2023, %r16166; | |
mov.u32 %r2022, %r16167; | |
mov.u32 %r2021, %r16168; | |
mov.u32 %r2020, %r16169; | |
mov.u32 %r2019, %r16170; | |
mov.u32 %r2018, %r16171; | |
mov.u32 %r2017, %r16172; | |
mov.u32 %r2016, %r16173; | |
mov.u32 %r2015, %r16174; | |
mov.u32 %r2014, %r16175; | |
mov.u32 %r2013, %r16176; | |
mov.u32 %r2012, %r16177; | |
mov.u32 %r2011, %r16178; | |
mov.u32 %r2010, %r16179; | |
mov.u32 %r2009, %r16180; | |
mov.u32 %r2008, %r16181; | |
mov.u32 %r2007, %r16182; | |
mov.u32 %r2006, %r16183; | |
mov.u32 %r2005, %r16184; | |
mov.u32 %r2004, %r16185; | |
mov.u32 %r2003, %r16186; | |
mov.u32 %r2002, %r16187; | |
mov.u32 %r2001, %r16188; | |
mov.u32 %r2000, %r16189; | |
mov.u32 %r1999, %r16190; | |
mov.u32 %r1998, %r16191; | |
mov.u32 %r1997, %r16192; | |
mov.u32 %r1996, %r16193; | |
mov.u32 %r1995, %r16194; | |
mov.u32 %r1994, %r16195; | |
mov.u32 %r1993, %r16196; | |
setp.le.u32 %p260, %r15621, %r2056; | |
mov.u32 %r15685, %r2056; | |
mov.u32 %r15686, %r2055; | |
mov.u32 %r15687, %r2054; | |
mov.u32 %r15688, %r2053; | |
mov.u32 %r15689, %r2052; | |
mov.u32 %r15690, %r2051; | |
mov.u32 %r15691, %r2050; | |
mov.u32 %r15692, %r2049; | |
mov.u32 %r15693, %r2048; | |
mov.u32 %r15694, %r2047; | |
mov.u32 %r15695, %r2046; | |
mov.u32 %r15696, %r2045; | |
mov.u32 %r15697, %r2044; | |
mov.u32 %r15698, %r2043; | |
mov.u32 %r15699, %r2042; | |
mov.u32 %r15700, %r2041; | |
mov.u32 %r15701, %r2040; | |
mov.u32 %r15702, %r2039; | |
mov.u32 %r15703, %r2038; | |
mov.u32 %r15704, %r2037; | |
mov.u32 %r15705, %r2036; | |
mov.u32 %r15706, %r2035; | |
mov.u32 %r15707, %r2034; | |
mov.u32 %r15708, %r2033; | |
mov.u32 %r15709, %r2032; | |
mov.u32 %r15710, %r2031; | |
mov.u32 %r15711, %r2030; | |
mov.u32 %r15712, %r2029; | |
mov.u32 %r15713, %r2028; | |
mov.u32 %r15714, %r2027; | |
mov.u32 %r15715, %r2026; | |
mov.u32 %r15716, %r2025; | |
mov.u32 %r15717, %r2024; | |
mov.u32 %r15718, %r2023; | |
mov.u32 %r15719, %r2022; | |
mov.u32 %r15720, %r2021; | |
mov.u32 %r15721, %r2020; | |
mov.u32 %r15722, %r2019; | |
mov.u32 %r15723, %r2018; | |
mov.u32 %r15724, %r2017; | |
mov.u32 %r15725, %r2016; | |
mov.u32 %r15726, %r2015; | |
mov.u32 %r15727, %r2014; | |
mov.u32 %r15728, %r2013; | |
mov.u32 %r15729, %r2012; | |
mov.u32 %r15730, %r2011; | |
mov.u32 %r15731, %r2010; | |
mov.u32 %r15732, %r2009; | |
mov.u32 %r15733, %r2008; | |
mov.u32 %r15734, %r2007; | |
mov.u32 %r15735, %r2006; | |
mov.u32 %r15736, %r2005; | |
mov.u32 %r15737, %r2004; | |
mov.u32 %r15738, %r2003; | |
mov.u32 %r15739, %r2002; | |
mov.u32 %r15740, %r2001; | |
mov.u32 %r15741, %r2000; | |
mov.u32 %r15742, %r1999; | |
mov.u32 %r15743, %r1998; | |
mov.u32 %r15744, %r1997; | |
mov.u32 %r15745, %r1996; | |
mov.u32 %r15746, %r1995; | |
mov.u32 %r15747, %r1994; | |
mov.u32 %r15748, %r1993; | |
@%p260 bra BB12_516; | |
st.local.v4.u32 [%rd2+512], {%r2056, %r2055, %r2054, %r2053}; | |
st.local.v4.u32 [%rd2+768], {%r15621, %r15622, %r15623, %r15624}; | |
st.local.v4.u32 [%rd2+528], {%r2052, %r2051, %r2050, %r2049}; | |
st.local.v4.u32 [%rd2+784], {%r15625, %r15626, %r15627, %r15628}; | |
st.local.v4.u32 [%rd2+544], {%r2048, %r2047, %r2046, %r2045}; | |
st.local.v4.u32 [%rd2+800], {%r15629, %r15630, %r15631, %r15632}; | |
st.local.v4.u32 [%rd2+560], {%r2044, %r2043, %r2042, %r2041}; | |
st.local.v4.u32 [%rd2+816], {%r15633, %r15634, %r15635, %r15636}; | |
st.local.v4.u32 [%rd2+576], {%r2040, %r2039, %r2038, %r2037}; | |
st.local.v4.u32 [%rd2+832], {%r15637, %r15638, %r15639, %r15640}; | |
st.local.v4.u32 [%rd2+592], {%r2036, %r2035, %r2034, %r2033}; | |
st.local.v4.u32 [%rd2+848], {%r15641, %r15642, %r15643, %r15644}; | |
st.local.v4.u32 [%rd2+608], {%r2032, %r2031, %r2030, %r2029}; | |
st.local.v4.u32 [%rd2+864], {%r15645, %r15646, %r15647, %r15648}; | |
st.local.v4.u32 [%rd2+624], {%r2028, %r2027, %r2026, %r2025}; | |
st.local.v4.u32 [%rd2+880], {%r15649, %r15650, %r15651, %r15652}; | |
st.local.v4.u32 [%rd2+640], {%r2024, %r2023, %r2022, %r2021}; | |
st.local.v4.u32 [%rd2+896], {%r15653, %r15654, %r15655, %r15656}; | |
st.local.v2.u32 [%rd2+912], {%r15657, %r15658}; | |
st.local.u32 [%rd2+920], %r15659; | |
st.local.v4.u32 [%rd2+656], {%r2020, %r2019, %r2018, %r2017}; | |
st.local.u32 [%rd2+924], %r15660; | |
st.local.u32 [%rd2+672], %r2016; | |
st.local.u32 [%rd2+928], %r15661; | |
st.local.u32 [%rd2+676], %r2015; | |
st.local.u32 [%rd2+932], %r15662; | |
st.local.u32 [%rd2+680], %r2014; | |
st.local.u32 [%rd2+936], %r15663; | |
st.local.u32 [%rd2+684], %r2013; | |
st.local.u32 [%rd2+940], %r15664; | |
st.local.u32 [%rd2+688], %r2012; | |
st.local.u32 [%rd2+944], %r15665; | |
st.local.u32 [%rd2+692], %r2011; | |
st.local.u32 [%rd2+948], %r15666; | |
st.local.u32 [%rd2+696], %r2010; | |
st.local.u32 [%rd2+952], %r15667; | |
st.local.u32 [%rd2+700], %r2009; | |
st.local.u32 [%rd2+956], %r15668; | |
st.local.u32 [%rd2+704], %r2008; | |
st.local.u32 [%rd2+960], %r15669; | |
st.local.u32 [%rd2+708], %r2007; | |
st.local.u32 [%rd2+964], %r15670; | |
st.local.u32 [%rd2+712], %r2006; | |
st.local.u32 [%rd2+968], %r15671; | |
st.local.u32 [%rd2+716], %r2005; | |
st.local.u32 [%rd2+972], %r15672; | |
st.local.u32 [%rd2+720], %r2004; | |
st.local.u32 [%rd2+976], %r15673; | |
st.local.u32 [%rd2+724], %r2003; | |
st.local.u32 [%rd2+980], %r15674; | |
st.local.u32 [%rd2+728], %r2002; | |
st.local.u32 [%rd2+984], %r15675; | |
st.local.u32 [%rd2+732], %r2001; | |
st.local.u32 [%rd2+988], %r15676; | |
st.local.u32 [%rd2+736], %r2000; | |
st.local.u32 [%rd2+992], %r15677; | |
st.local.u32 [%rd2+740], %r1999; | |
st.local.u32 [%rd2+996], %r15678; | |
st.local.u32 [%rd2+744], %r1998; | |
st.local.u32 [%rd2+1000], %r15679; | |
st.local.u32 [%rd2+748], %r1997; | |
st.local.u32 [%rd2+1004], %r15680; | |
st.local.u32 [%rd2+752], %r1996; | |
st.local.u32 [%rd2+1008], %r15681; | |
st.local.u32 [%rd2+756], %r1995; | |
st.local.u32 [%rd2+1012], %r15682; | |
st.local.u32 [%rd2+760], %r1994; | |
st.local.u32 [%rd2+1016], %r15683; | |
st.local.u32 [%rd2+764], %r1993; | |
st.local.u32 [%rd2+1020], %r15684; | |
mov.u32 %r14662, %r15684; | |
mov.u32 %r14664, %r15683; | |
mov.u32 %r14666, %r15682; | |
mov.u32 %r14668, %r15681; | |
mov.u32 %r14670, %r15680; | |
mov.u32 %r14672, %r15679; | |
mov.u32 %r14674, %r15678; | |
mov.u32 %r14676, %r15677; | |
mov.u32 %r14678, %r15676; | |
mov.u32 %r14680, %r15675; | |
mov.u32 %r14682, %r15674; | |
mov.u32 %r14684, %r15673; | |
mov.u32 %r14686, %r15672; | |
mov.u32 %r14688, %r15671; | |
mov.u32 %r14690, %r15670; | |
mov.u32 %r14692, %r15669; | |
mov.u32 %r14694, %r15668; | |
mov.u32 %r14696, %r15667; | |
mov.u32 %r14698, %r15666; | |
mov.u32 %r14700, %r15665; | |
mov.u32 %r14702, %r15664; | |
mov.u32 %r14704, %r15663; | |
mov.u32 %r14706, %r15662; | |
mov.u32 %r14708, %r15661; | |
mov.u32 %r14710, %r15660; | |
mov.u32 %r14712, %r15659; | |
mov.u32 %r14714, %r15658; | |
mov.u32 %r14716, %r15657; | |
mov.u32 %r14718, %r15656; | |
mov.u32 %r14720, %r15655; | |
mov.u32 %r14722, %r15654; | |
mov.u32 %r14724, %r15653; | |
mov.u32 %r14726, %r15652; | |
mov.u32 %r14728, %r15651; | |
mov.u32 %r14730, %r15650; | |
mov.u32 %r14732, %r15649; | |
mov.u32 %r14734, %r15648; | |
mov.u32 %r14736, %r15647; | |
mov.u32 %r14738, %r15646; | |
mov.u32 %r14740, %r15645; | |
mov.u32 %r14742, %r15644; | |
mov.u32 %r14744, %r15643; | |
mov.u32 %r14746, %r15642; | |
mov.u32 %r14748, %r15641; | |
mov.u32 %r14750, %r15640; | |
mov.u32 %r14752, %r15639; | |
mov.u32 %r14754, %r15638; | |
mov.u32 %r14756, %r15637; | |
mov.u32 %r14758, %r15636; | |
mov.u32 %r14760, %r15635; | |
mov.u32 %r14762, %r15634; | |
mov.u32 %r14764, %r15633; | |
mov.u32 %r14766, %r15632; | |
mov.u32 %r14768, %r15631; | |
mov.u32 %r14770, %r15630; | |
mov.u32 %r14772, %r15629; | |
mov.u32 %r14774, %r15628; | |
mov.u32 %r14776, %r15627; | |
mov.u32 %r14778, %r15626; | |
mov.u32 %r14780, %r15625; | |
mov.u32 %r14782, %r15624; | |
mov.u32 %r14784, %r15623; | |
mov.u32 %r14786, %r15622; | |
mov.u32 %r14788, %r15621; | |
mov.u32 %r15684, %r1993; | |
mov.u32 %r15683, %r1994; | |
mov.u32 %r15682, %r1995; | |
mov.u32 %r15681, %r1996; | |
mov.u32 %r15680, %r1997; | |
mov.u32 %r15679, %r1998; | |
mov.u32 %r15678, %r1999; | |
mov.u32 %r15677, %r2000; | |
mov.u32 %r15676, %r2001; | |
mov.u32 %r15675, %r2002; | |
mov.u32 %r15674, %r2003; | |
mov.u32 %r15673, %r2004; | |
mov.u32 %r15672, %r2005; | |
mov.u32 %r15671, %r2006; | |
mov.u32 %r15670, %r2007; | |
mov.u32 %r15669, %r2008; | |
mov.u32 %r15668, %r2009; | |
mov.u32 %r15667, %r2010; | |
mov.u32 %r15666, %r2011; | |
mov.u32 %r15665, %r2012; | |
mov.u32 %r15664, %r2013; | |
mov.u32 %r15663, %r2014; | |
mov.u32 %r15662, %r2015; | |
mov.u32 %r15661, %r2016; | |
mov.u32 %r15660, %r2017; | |
mov.u32 %r15659, %r2018; | |
mov.u32 %r15658, %r2019; | |
mov.u32 %r15657, %r2020; | |
mov.u32 %r15656, %r2021; | |
mov.u32 %r15655, %r2022; | |
mov.u32 %r15654, %r2023; | |
mov.u32 %r15653, %r2024; | |
mov.u32 %r15652, %r2025; | |
mov.u32 %r15651, %r2026; | |
mov.u32 %r15650, %r2027; | |
mov.u32 %r15649, %r2028; | |
mov.u32 %r15648, %r2029; | |
mov.u32 %r15647, %r2030; | |
mov.u32 %r15646, %r2031; | |
mov.u32 %r15645, %r2032; | |
mov.u32 %r15644, %r2033; | |
mov.u32 %r15643, %r2034; | |
mov.u32 %r15642, %r2035; | |
mov.u32 %r15641, %r2036; | |
mov.u32 %r15640, %r2037; | |
mov.u32 %r15639, %r2038; | |
mov.u32 %r15638, %r2039; | |
mov.u32 %r15637, %r2040; | |
mov.u32 %r15636, %r2041; | |
mov.u32 %r15635, %r2042; | |
mov.u32 %r15634, %r2043; | |
mov.u32 %r15633, %r2044; | |
mov.u32 %r15632, %r2045; | |
mov.u32 %r15631, %r2046; | |
mov.u32 %r15630, %r2047; | |
mov.u32 %r15629, %r2048; | |
mov.u32 %r15628, %r2049; | |
mov.u32 %r15627, %r2050; | |
mov.u32 %r15626, %r2051; | |
mov.u32 %r15625, %r2052; | |
mov.u32 %r15624, %r2053; | |
mov.u32 %r15623, %r2054; | |
mov.u32 %r15622, %r2055; | |
mov.u32 %r15621, %r2056; | |
mov.u32 %r15685, %r14788; | |
mov.u32 %r15686, %r14786; | |
mov.u32 %r15687, %r14784; | |
mov.u32 %r15688, %r14782; | |
mov.u32 %r15689, %r14780; | |
mov.u32 %r15690, %r14778; | |
mov.u32 %r15691, %r14776; | |
mov.u32 %r15692, %r14774; | |
mov.u32 %r15693, %r14772; | |
mov.u32 %r15694, %r14770; | |
mov.u32 %r15695, %r14768; | |
mov.u32 %r15696, %r14766; | |
mov.u32 %r15697, %r14764; | |
mov.u32 %r15698, %r14762; | |
mov.u32 %r15699, %r14760; | |
mov.u32 %r15700, %r14758; | |
mov.u32 %r15701, %r14756; | |
mov.u32 %r15702, %r14754; | |
mov.u32 %r15703, %r14752; | |
mov.u32 %r15704, %r14750; | |
mov.u32 %r15705, %r14748; | |
mov.u32 %r15706, %r14746; | |
mov.u32 %r15707, %r14744; | |
mov.u32 %r15708, %r14742; | |
mov.u32 %r15709, %r14740; | |
mov.u32 %r15710, %r14738; | |
mov.u32 %r15711, %r14736; | |
mov.u32 %r15712, %r14734; | |
mov.u32 %r15713, %r14732; | |
mov.u32 %r15714, %r14730; | |
mov.u32 %r15715, %r14728; | |
mov.u32 %r15716, %r14726; | |
mov.u32 %r15717, %r14724; | |
mov.u32 %r15718, %r14722; | |
mov.u32 %r15719, %r14720; | |
mov.u32 %r15720, %r14718; | |
mov.u32 %r15721, %r14716; | |
mov.u32 %r15722, %r14714; | |
mov.u32 %r15723, %r14712; | |
mov.u32 %r15724, %r14710; | |
mov.u32 %r15725, %r14708; | |
mov.u32 %r15726, %r14706; | |
mov.u32 %r15727, %r14704; | |
mov.u32 %r15728, %r14702; | |
mov.u32 %r15729, %r14700; | |
mov.u32 %r15730, %r14698; | |
mov.u32 %r15731, %r14696; | |
mov.u32 %r15732, %r14694; | |
mov.u32 %r15733, %r14692; | |
mov.u32 %r15734, %r14690; | |
mov.u32 %r15735, %r14688; | |
mov.u32 %r15736, %r14686; | |
mov.u32 %r15737, %r14684; | |
mov.u32 %r15738, %r14682; | |
mov.u32 %r15739, %r14680; | |
mov.u32 %r15740, %r14678; | |
mov.u32 %r15741, %r14676; | |
mov.u32 %r15742, %r14674; | |
mov.u32 %r15743, %r14672; | |
mov.u32 %r15744, %r14670; | |
mov.u32 %r15745, %r14668; | |
mov.u32 %r15746, %r14666; | |
mov.u32 %r15747, %r14664; | |
mov.u32 %r15748, %r14662; | |
BB12_516: | |
setp.le.u32 %p261, %r13061, %r15621; | |
@%p261 bra BB12_518; | |
st.local.v4.u32 [%rd2], {%r15621, %r15622, %r15623, %r15624}; | |
st.local.v4.u32 [%rd2+512], {%r13061, %r13062, %r13063, %r13064}; | |
st.local.v4.u32 [%rd2+16], {%r15625, %r15626, %r15627, %r15628}; | |
st.local.v4.u32 [%rd2+528], {%r13065, %r13066, %r13067, %r13068}; | |
st.local.v4.u32 [%rd2+32], {%r15629, %r15630, %r15631, %r15632}; | |
st.local.v4.u32 [%rd2+544], {%r13069, %r13070, %r13071, %r13072}; | |
st.local.v4.u32 [%rd2+48], {%r15633, %r15634, %r15635, %r15636}; | |
st.local.v4.u32 [%rd2+560], {%r13073, %r13074, %r13075, %r13076}; | |
st.local.v4.u32 [%rd2+64], {%r15637, %r15638, %r15639, %r15640}; | |
st.local.v4.u32 [%rd2+576], {%r13077, %r13078, %r13079, %r13080}; | |
st.local.v4.u32 [%rd2+80], {%r15641, %r15642, %r15643, %r15644}; | |
st.local.v4.u32 [%rd2+592], {%r13081, %r13082, %r13083, %r13084}; | |
st.local.v4.u32 [%rd2+96], {%r15645, %r15646, %r15647, %r15648}; | |
st.local.v4.u32 [%rd2+608], {%r13085, %r13086, %r13087, %r13088}; | |
st.local.v4.u32 [%rd2+112], {%r15649, %r15650, %r15651, %r15652}; | |
st.local.v4.u32 [%rd2+624], {%r13089, %r13090, %r13091, %r13092}; | |
st.local.v4.u32 [%rd2+128], {%r15653, %r15654, %r15655, %r15656}; | |
st.local.v4.u32 [%rd2+640], {%r13093, %r13094, %r13095, %r13096}; | |
st.local.v2.u32 [%rd2+656], {%r13097, %r13098}; | |
st.local.u32 [%rd2+664], %r13099; | |
st.local.v4.u32 [%rd2+144], {%r15657, %r15658, %r15659, %r15660}; | |
st.local.u32 [%rd2+668], %r13100; | |
st.local.u32 [%rd2+160], %r15661; | |
st.local.u32 [%rd2+672], %r13101; | |
st.local.u32 [%rd2+164], %r15662; | |
st.local.u32 [%rd2+676], %r13102; | |
st.local.u32 [%rd2+168], %r15663; | |
st.local.u32 [%rd2+680], %r13103; | |
st.local.u32 [%rd2+172], %r15664; | |
st.local.u32 [%rd2+684], %r13104; | |
st.local.u32 [%rd2+176], %r15665; | |
st.local.u32 [%rd2+688], %r13105; | |
st.local.u32 [%rd2+180], %r15666; | |
st.local.u32 [%rd2+692], %r13106; | |
st.local.u32 [%rd2+184], %r15667; | |
st.local.u32 [%rd2+696], %r13107; | |
st.local.u32 [%rd2+188], %r15668; | |
st.local.u32 [%rd2+700], %r13108; | |
st.local.u32 [%rd2+192], %r15669; | |
st.local.u32 [%rd2+704], %r13109; | |
st.local.u32 [%rd2+196], %r15670; | |
st.local.u32 [%rd2+708], %r13110; | |
st.local.u32 [%rd2+200], %r15671; | |
st.local.u32 [%rd2+712], %r13111; | |
st.local.u32 [%rd2+204], %r15672; | |
st.local.u32 [%rd2+716], %r13112; | |
st.local.u32 [%rd2+208], %r15673; | |
st.local.u32 [%rd2+720], %r13113; | |
st.local.u32 [%rd2+212], %r15674; | |
st.local.u32 [%rd2+724], %r13114; | |
st.local.u32 [%rd2+216], %r15675; | |
st.local.u32 [%rd2+728], %r13115; | |
st.local.u32 [%rd2+220], %r15676; | |
st.local.u32 [%rd2+732], %r13116; | |
st.local.u32 [%rd2+224], %r15677; | |
st.local.u32 [%rd2+736], %r13117; | |
st.local.u32 [%rd2+228], %r15678; | |
st.local.u32 [%rd2+740], %r13118; | |
st.local.u32 [%rd2+232], %r15679; | |
st.local.u32 [%rd2+744], %r13119; | |
st.local.u32 [%rd2+236], %r15680; | |
st.local.u32 [%rd2+748], %r13120; | |
st.local.u32 [%rd2+240], %r15681; | |
st.local.u32 [%rd2+752], %r13121; | |
st.local.u32 [%rd2+244], %r15682; | |
st.local.u32 [%rd2+756], %r13122; | |
st.local.u32 [%rd2+248], %r15683; | |
st.local.u32 [%rd2+760], %r13123; | |
st.local.u32 [%rd2+252], %r15684; | |
st.local.u32 [%rd2+764], %r13124; | |
st.local.u32 [%rd2+256], %r15685; | |
st.local.u32 [%rd2+768], %r13125; | |
st.local.u32 [%rd2+260], %r15686; | |
st.local.u32 [%rd2+772], %r13126; | |
st.local.u32 [%rd2+264], %r15687; | |
st.local.u32 [%rd2+776], %r13127; | |
st.local.u32 [%rd2+268], %r15688; | |
st.local.u32 [%rd2+780], %r13128; | |
st.local.u32 [%rd2+272], %r15689; | |
st.local.u32 [%rd2+784], %r13129; | |
st.local.u32 [%rd2+276], %r15690; | |
st.local.u32 [%rd2+788], %r13130; | |
st.local.u32 [%rd2+280], %r15691; | |
st.local.u32 [%rd2+792], %r13131; | |
st.local.u32 [%rd2+284], %r15692; | |
st.local.u32 [%rd2+796], %r13132; | |
st.local.u32 [%rd2+288], %r15693; | |
st.local.u32 [%rd2+800], %r13133; | |
st.local.u32 [%rd2+292], %r15694; | |
st.local.u32 [%rd2+804], %r13134; | |
st.local.u32 [%rd2+296], %r15695; | |
st.local.u32 [%rd2+808], %r13135; | |
st.local.u32 [%rd2+300], %r15696; | |
st.local.u32 [%rd2+812], %r13136; | |
st.local.u32 [%rd2+304], %r15697; | |
st.local.u32 [%rd2+816], %r13137; | |
st.local.u32 [%rd2+308], %r15698; | |
st.local.u32 [%rd2+820], %r13138; | |
st.local.u32 [%rd2+312], %r15699; | |
st.local.u32 [%rd2+824], %r13139; | |
st.local.u32 [%rd2+316], %r15700; | |
st.local.u32 [%rd2+828], %r13140; | |
st.local.u32 [%rd2+320], %r15701; | |
st.local.u32 [%rd2+832], %r13141; | |
st.local.u32 [%rd2+324], %r15702; | |
st.local.u32 [%rd2+836], %r13142; | |
st.local.u32 [%rd2+328], %r15703; | |
st.local.u32 [%rd2+840], %r13143; | |
st.local.u32 [%rd2+332], %r15704; | |
st.local.u32 [%rd2+844], %r13144; | |
st.local.u32 [%rd2+336], %r15705; | |
st.local.u32 [%rd2+848], %r13145; | |
st.local.u32 [%rd2+340], %r15706; | |
st.local.u32 [%rd2+852], %r13146; | |
st.local.u32 [%rd2+344], %r15707; | |
st.local.u32 [%rd2+856], %r13147; | |
st.local.u32 [%rd2+348], %r15708; | |
st.local.u32 [%rd2+860], %r13148; | |
st.local.u32 [%rd2+352], %r15709; | |
st.local.u32 [%rd2+864], %r13149; | |
st.local.u32 [%rd2+356], %r15710; | |
st.local.u32 [%rd2+868], %r13150; | |
st.local.u32 [%rd2+360], %r15711; | |
st.local.u32 [%rd2+872], %r13151; | |
st.local.u32 [%rd2+364], %r15712; | |
st.local.u32 [%rd2+876], %r13152; | |
st.local.u32 [%rd2+368], %r15713; | |
st.local.u32 [%rd2+880], %r13153; | |
st.local.u32 [%rd2+372], %r15714; | |
st.local.u32 [%rd2+884], %r13154; | |
st.local.u32 [%rd2+376], %r15715; | |
st.local.u32 [%rd2+888], %r13155; | |
st.local.u32 [%rd2+380], %r15716; | |
st.local.u32 [%rd2+892], %r13156; | |
st.local.u32 [%rd2+384], %r15717; | |
st.local.u32 [%rd2+896], %r13157; | |
st.local.u32 [%rd2+388], %r15718; | |
st.local.u32 [%rd2+900], %r13158; | |
st.local.u32 [%rd2+392], %r15719; | |
st.local.u32 [%rd2+904], %r13159; | |
st.local.u32 [%rd2+396], %r15720; | |
st.local.u32 [%rd2+908], %r13160; | |
st.local.u32 [%rd2+400], %r15721; | |
st.local.u32 [%rd2+912], %r13161; | |
st.local.u32 [%rd2+404], %r15722; | |
st.local.u32 [%rd2+916], %r13162; | |
st.local.u32 [%rd2+408], %r15723; | |
st.local.u32 [%rd2+920], %r13163; | |
st.local.u32 [%rd2+412], %r15724; | |
st.local.u32 [%rd2+924], %r13164; | |
st.local.u32 [%rd2+416], %r15725; | |
st.local.u32 [%rd2+928], %r13165; | |
st.local.u32 [%rd2+420], %r15726; | |
st.local.u32 [%rd2+932], %r13166; | |
st.local.u32 [%rd2+424], %r15727; | |
st.local.u32 [%rd2+936], %r13167; | |
st.local.u32 [%rd2+428], %r15728; | |
st.local.u32 [%rd2+940], %r13168; | |
st.local.u32 [%rd2+432], %r15729; | |
st.local.u32 [%rd2+944], %r13169; | |
st.local.u32 [%rd2+436], %r15730; | |
st.local.u32 [%rd2+948], %r13170; | |
st.local.u32 [%rd2+440], %r15731; | |
st.local.u32 [%rd2+952], %r13171; | |
st.local.u32 [%rd2+444], %r15732; | |
st.local.u32 [%rd2+956], %r13172; | |
st.local.u32 [%rd2+448], %r15733; | |
st.local.u32 [%rd2+960], %r13173; | |
st.local.u32 [%rd2+452], %r15734; | |
st.local.u32 [%rd2+964], %r13174; | |
st.local.u32 [%rd2+456], %r15735; | |
st.local.u32 [%rd2+968], %r13175; | |
st.local.u32 [%rd2+460], %r15736; | |
st.local.u32 [%rd2+972], %r13176; | |
st.local.u32 [%rd2+464], %r15737; | |
st.local.u32 [%rd2+976], %r13177; | |
st.local.u32 [%rd2+468], %r15738; | |
st.local.u32 [%rd2+980], %r13178; | |
st.local.u32 [%rd2+472], %r15739; | |
st.local.u32 [%rd2+984], %r13179; | |
st.local.u32 [%rd2+476], %r15740; | |
st.local.u32 [%rd2+988], %r13180; | |
st.local.u32 [%rd2+480], %r15741; | |
st.local.u32 [%rd2+992], %r13181; | |
st.local.u32 [%rd2+484], %r15742; | |
st.local.u32 [%rd2+996], %r13182; | |
st.local.u32 [%rd2+488], %r15743; | |
st.local.u32 [%rd2+1000], %r13183; | |
st.local.u32 [%rd2+492], %r15744; | |
st.local.u32 [%rd2+1004], %r13184; | |
st.local.u32 [%rd2+496], %r15745; | |
st.local.u32 [%rd2+1008], %r13185; | |
st.local.u32 [%rd2+500], %r15746; | |
st.local.u32 [%rd2+1012], %r13186; | |
st.local.u32 [%rd2+504], %r15747; | |
st.local.u32 [%rd2+1016], %r13187; | |
st.local.u32 [%rd2+508], %r15748; | |
st.local.u32 [%rd2+1020], %r13188; | |
BB12_518: | |
shl.b32 %r11393, %r11395, 22; | |
add.u64 %rd5890, %SP, 1024; | |
or.b32 %r7160, %r9, %r11393; | |
bfe.u32 %r7161, %r7160, 22, 6; | |
mul.wide.u32 %rd2239, %r7161, 28; | |
add.s64 %rd142, %rd451, %rd2239; | |
ld.global.u32 %r7162, [%rd142]; | |
add.s64 %rd2241, %rd5890, 1024; | |
// Callseq Start 0 | |
{ | |
.reg .b32 temp_param_reg; | |
// <end>} | |
.param .b64 param0; | |
st.param.b64 [param0+0], %rd414; | |
.param .b64 param1; | |
st.param.b64 [param1+0], %rd415; | |
.param .b32 param2; | |
st.param.b32 [param2+0], %r7162; | |
.param .b64 param3; | |
st.param.b64 [param3+0], %rd2241; | |
call.uni | |
local_listindices8, | |
( | |
param0, | |
param1, | |
param2, | |
param3 | |
); | |
//{ | |
}// Callseq End 0 | |
ld.local.u32 %r7163, [%rd2+1024]; | |
ld.local.u32 %r16517, [%rd2]; | |
mov.u32 %r7159, 0; | |
mov.u32 %r16518, %r7159; | |
setp.le.u32 %p262, %r16517, %r7163; | |
mov.u32 %r16522, %r7159; | |
@%p262 bra BB12_521; | |
bra.uni BB12_519; | |
BB12_520: | |
ld.local.u32 %r16517, [%rd143+64]; | |
BB12_519: | |
mov.u32 %r2186, %r16517; | |
mul.wide.u32 %rd2242, %r16518, 4; | |
add.s64 %rd143, %rd2, %rd2242; | |
ld.local.v4.u32 {%r7165, %r7166, %r7167, %r7168}, [%rd143+1024]; | |
ld.local.u32 %r7173, [%rd143+4]; | |
ld.local.v2.u32 {%r7174, %r7175}, [%rd143+8]; | |
ld.local.v4.u32 {%r7178, %r7179, %r7180, %r7181}, [%rd143+16]; | |
ld.local.v4.u32 {%r7182, %r7183, %r7184, %r7185}, [%rd143+1040]; | |
ld.local.v4.u32 {%r7186, %r7187, %r7188, %r7189}, [%rd143+32]; | |
ld.local.v4.u32 {%r7190, %r7191, %r7192, %r7193}, [%rd143+1056]; | |
ld.local.v2.u32 {%r7194, %r7195}, [%rd143+48]; | |
ld.local.v2.u32 {%r7196, %r7197}, [%rd143+1072]; | |
st.local.v4.u32 [%rd143], {%r7165, %r7166, %r7167, %r7168}; | |
st.local.v4.u32 [%rd143+1024], {%r2186, %r7173, %r7174, %r7175}; | |
st.local.v4.u32 [%rd143+16], {%r7182, %r7183, %r7184, %r7185}; | |
st.local.v4.u32 [%rd143+1040], {%r7178, %r7179, %r7180, %r7181}; | |
st.local.v4.u32 [%rd143+32], {%r7190, %r7191, %r7192, %r7193}; | |
st.local.v4.u32 [%rd143+1056], {%r7186, %r7187, %r7188, %r7189}; | |
st.local.v2.u32 [%rd143+48], {%r7196, %r7197}; | |
st.local.v2.u32 [%rd143+1072], {%r7194, %r7195}; | |
ld.local.v2.u32 {%r7218, %r7219}, [%rd143+1080]; | |
ld.local.v2.u32 {%r7222, %r7223}, [%rd143+56]; | |
st.local.v2.u32 [%rd143+56], {%r7218, %r7219}; | |
st.local.v2.u32 [%rd143+1080], {%r7222, %r7223}; | |
add.s32 %r16518, %r16518, 16; | |
setp.eq.s32 %p263, %r16518, 256; | |
mov.u32 %r16520, %r7159; | |
mov.u32 %r16522, %r16520; | |
@%p263 bra BB12_521; | |
bra.uni BB12_520; | |
BB12_521: | |
mov.u32 %r2190, %r16522; | |
mul.wide.u32 %rd2243, %r2190, 2; | |
add.s64 %rd2244, %rd1, %rd2243; | |
mov.u16 %rs13, -1; | |
st.local.u16 [%rd2244], %rs13; | |
st.local.u16 [%rd2244+62], %rs13; | |
mov.u64 %rd2245, 65535; | |
st.local.u16 [%rd2244+8], %rd2245; | |
st.local.u16 [%rd2244+6], %rd2245; | |
st.local.u16 [%rd2244+4], %rd2245; | |
st.local.u16 [%rd2244+2], %rd2245; | |
st.local.u16 [%rd2244+16], %rd2245; | |
st.local.u16 [%rd2244+14], %rd2245; | |
st.local.u16 [%rd2244+12], %rd2245; | |
st.local.u16 [%rd2244+10], %rd2245; | |
st.local.u16 [%rd2244+24], %rd2245; | |
st.local.u16 [%rd2244+22], %rd2245; | |
st.local.u16 [%rd2244+20], %rd2245; | |
st.local.u16 [%rd2244+18], %rd2245; | |
st.local.u16 [%rd2244+32], %rd2245; | |
st.local.u16 [%rd2244+30], %rd2245; | |
st.local.u16 [%rd2244+28], %rd2245; | |
st.local.u16 [%rd2244+26], %rd2245; | |
st.local.u16 [%rd2244+40], %rd2245; | |
st.local.u16 [%rd2244+38], %rd2245; | |
st.local.u16 [%rd2244+36], %rd2245; | |
st.local.u16 [%rd2244+34], %rd2245; | |
st.local.u16 [%rd2244+48], %rd2245; | |
st.local.u16 [%rd2244+46], %rd2245; | |
st.local.u16 [%rd2244+44], %rd2245; | |
st.local.u16 [%rd2244+42], %rd2245; | |
st.local.u16 [%rd2244+56], %rd2245; | |
st.local.u16 [%rd2244+54], %rd2245; | |
st.local.u16 [%rd2244+52], %rd2245; | |
st.local.u16 [%rd2244+50], %rd2245; | |
mov.u32 %r7227, 65535; | |
st.local.u16 [%rd2244+60], %r7227; | |
st.local.u16 [%rd2244+58], %r7227; | |
add.s32 %r2191, %r2190, 32; | |
setp.ne.s32 %p264, %r2191, 512; | |
mov.u32 %r16521, %r7159; | |
mov.u32 %r16522, %r2191; | |
@%p264 bra BB12_521; | |
BB12_522: | |
mul.wide.u32 %rd2246, %r16521, 4; | |
add.s64 %rd2247, %rd2, %rd2246; | |
ld.local.u32 %r7228, [%rd2247]; | |
and.b32 %r7229, %r7228, 511; | |
shr.u32 %r7230, %r7228, 9; | |
mul.wide.u32 %rd2248, %r7229, 2; | |
add.s64 %rd144, %rd1, %rd2248; | |
cvt.u16.u32 %rs3, %r7230; | |
ld.local.u16 %rs14, [%rd144]; | |
setp.eq.s16 %p265, %rs14, %rs3; | |
@%p265 bra BB12_1566; | |
st.local.u16 [%rd144], %rs3; | |
add.s32 %r7231, %r16521, 1; | |
mul.wide.u32 %rd2249, %r7231, 4; | |
add.s64 %rd2250, %rd2, %rd2249; | |
ld.local.u32 %r7232, [%rd2250]; | |
and.b32 %r7233, %r7232, 511; | |
shr.u32 %r7234, %r7232, 9; | |
mul.wide.u32 %rd2251, %r7233, 2; | |
add.s64 %rd145, %rd1, %rd2251; | |
cvt.u16.u32 %rs4, %r7234; | |
ld.local.u16 %rs15, [%rd145]; | |
setp.eq.s16 %p266, %rs15, %rs4; | |
@%p266 bra BB12_1566; | |
st.local.u16 [%rd145], %rs4; | |
add.s32 %r7235, %r16521, 2; | |
mul.wide.u32 %rd2252, %r7235, 4; | |
add.s64 %rd2253, %rd2, %rd2252; | |
ld.local.u32 %r7236, [%rd2253]; | |
and.b32 %r7237, %r7236, 511; | |
shr.u32 %r7238, %r7236, 9; | |
mul.wide.u32 %rd2254, %r7237, 2; | |
add.s64 %rd146, %rd1, %rd2254; | |
cvt.u16.u32 %rs5, %r7238; | |
ld.local.u16 %rs16, [%rd146]; | |
setp.eq.s16 %p267, %rs16, %rs5; | |
@%p267 bra BB12_1566; | |
st.local.u16 [%rd146], %rs5; | |
add.s32 %r7239, %r16521, 3; | |
mul.wide.u32 %rd2255, %r7239, 4; | |
add.s64 %rd2256, %rd2, %rd2255; | |
ld.local.u32 %r7240, [%rd2256]; | |
and.b32 %r7241, %r7240, 511; | |
shr.u32 %r7242, %r7240, 9; | |
mul.wide.u32 %rd2257, %r7241, 2; | |
add.s64 %rd147, %rd1, %rd2257; | |
cvt.u16.u32 %rs6, %r7242; | |
ld.local.u16 %rs17, [%rd147]; | |
setp.eq.s16 %p268, %rs17, %rs6; | |
@%p268 bra BB12_1566; | |
st.local.u16 [%rd147], %rs6; | |
add.s32 %r7243, %r16521, 4; | |
mul.wide.u32 %rd2258, %r7243, 4; | |
add.s64 %rd2259, %rd2, %rd2258; | |
ld.local.u32 %r7244, [%rd2259]; | |
and.b32 %r7245, %r7244, 511; | |
shr.u32 %r7246, %r7244, 9; | |
mul.wide.u32 %rd2260, %r7245, 2; | |
add.s64 %rd148, %rd1, %rd2260; | |
cvt.u16.u32 %rs7, %r7246; | |
ld.local.u16 %rs18, [%rd148]; | |
setp.eq.s16 %p269, %rs18, %rs7; | |
@%p269 bra BB12_1566; | |
st.local.u16 [%rd148], %rs7; | |
add.s32 %r7247, %r16521, 5; | |
mul.wide.u32 %rd2261, %r7247, 4; | |
add.s64 %rd2262, %rd2, %rd2261; | |
ld.local.u32 %r7248, [%rd2262]; | |
and.b32 %r7249, %r7248, 511; | |
shr.u32 %r7250, %r7248, 9; | |
mul.wide.u32 %rd2263, %r7249, 2; | |
add.s64 %rd149, %rd1, %rd2263; | |
cvt.u16.u32 %rs8, %r7250; | |
ld.local.u16 %rs19, [%rd149]; | |
setp.eq.s16 %p270, %rs19, %rs8; | |
@%p270 bra BB12_1566; | |
st.local.u16 [%rd149], %rs8; | |
add.s32 %r7251, %r16521, 6; | |
mul.wide.u32 %rd2264, %r7251, 4; | |
add.s64 %rd2265, %rd2, %rd2264; | |
ld.local.u32 %r7252, [%rd2265]; | |
and.b32 %r7253, %r7252, 511; | |
shr.u32 %r7254, %r7252, 9; | |
mul.wide.u32 %rd2266, %r7253, 2; | |
add.s64 %rd150, %rd1, %rd2266; | |
cvt.u16.u32 %rs9, %r7254; | |
ld.local.u16 %rs20, [%rd150]; | |
setp.eq.s16 %p271, %rs20, %rs9; | |
@%p271 bra BB12_1566; | |
st.local.u16 [%rd150], %rs9; | |
add.s32 %r7255, %r16521, 7; | |
mul.wide.u32 %rd2267, %r7255, 4; | |
add.s64 %rd2268, %rd2, %rd2267; | |
ld.local.u32 %r7256, [%rd2268]; | |
and.b32 %r7257, %r7256, 511; | |
shr.u32 %r7258, %r7256, 9; | |
mul.wide.u32 %rd2269, %r7257, 2; | |
add.s64 %rd151, %rd1, %rd2269; | |
cvt.u16.u32 %rs10, %r7258; | |
ld.local.u16 %rs21, [%rd151]; | |
setp.eq.s16 %p272, %rs21, %rs10; | |
@%p272 bra BB12_1566; | |
st.local.u16 [%rd151], %rs10; | |
add.s32 %r16521, %r16521, 8; | |
setp.lt.u32 %p273, %r16521, 512; | |
@%p273 bra BB12_522; | |
ld.param.u64 %rd5891, [digitK_param_4]; | |
atom.global.add.u32 %r2194, [%rd5891], 1; | |
setp.gt.u32 %p274, %r2194, 7; | |
@%p274 bra BB12_1566; | |
ld.global.u32 %r2195, [%rd13]; | |
and.b32 %r7259, %r2195, 65535; | |
bfe.u32 %r7260, %r2195, 16, 6; | |
mul.wide.u32 %rd2270, %r7259, 1792; | |
add.s64 %rd2271, %rd6, %rd2270; | |
mul.wide.u32 %rd2272, %r7260, 28; | |
add.s64 %rd2273, %rd2271, %rd2272; | |
ld.global.u32 %r2196, [%rd2273]; | |
and.b32 %r7261, %r2196, 65535; | |
mul.wide.u32 %rd2274, %r7261, 1792; | |
add.s64 %rd2275, %rd4, %rd2274; | |
bfe.u32 %r7262, %r2196, 16, 6; | |
mul.wide.u32 %rd2276, %r7262, 28; | |
add.s64 %rd2277, %rd2275, %rd2276; | |
ld.global.u32 %r2197, [%rd2277+-4]; | |
and.b32 %r7263, %r2197, 65535; | |
mul.wide.u32 %rd2278, %r7263, 1792; | |
add.s64 %rd2279, %rd6, %rd2278; | |
bfe.u32 %r7264, %r2197, 16, 6; | |
mul.wide.u32 %rd2280, %r7264, 28; | |
add.s64 %rd2281, %rd2279, %rd2280; | |
ld.global.u32 %r2198, [%rd2281+-4]; | |
and.b32 %r7265, %r2198, 65535; | |
mul.wide.u32 %rd2282, %r7265, 1792; | |
add.s64 %rd2283, %rd4, %rd2282; | |
bfe.u32 %r7266, %r2198, 16, 6; | |
mul.wide.u32 %rd2284, %r7266, 28; | |
add.s64 %rd2285, %rd2283, %rd2284; | |
ld.global.u32 %r2199, [%rd2285+-8]; | |
and.b32 %r7267, %r2199, 65535; | |
mul.wide.u32 %rd2286, %r7267, 1792; | |
add.s64 %rd2287, %rd6, %rd2286; | |
bfe.u32 %r7268, %r2199, 16, 6; | |
mul.wide.u32 %rd2288, %r7268, 28; | |
add.s64 %rd2289, %rd2287, %rd2288; | |
ld.global.u32 %r2200, [%rd2289+-8]; | |
and.b32 %r7269, %r2200, 65535; | |
mul.wide.u32 %rd2290, %r7269, 1792; | |
add.s64 %rd2291, %rd4, %rd2290; | |
cvt.u64.u32 %rd152, %r2194; | |
mul.wide.u32 %rd2292, %r2194, 2048; | |
add.s64 %rd153, %rd417, %rd2292; | |
cvt.u64.u32 %rd154, %r7259; | |
cvt.u64.u32 %rd155, %r7261; | |
cvt.u64.u32 %rd156, %r7263; | |
cvt.u64.u32 %rd157, %r7265; | |
cvt.u64.u32 %rd158, %r7267; | |
cvt.u64.u32 %rd159, %r7269; | |
bfe.u32 %r7270, %r2200, 16, 6; | |
mul.wide.u32 %rd2293, %r7270, 28; | |
add.s64 %rd2294, %rd2291, %rd2293; | |
ld.global.u32 %r2201, [%rd2294+-12]; | |
and.b32 %r7271, %r2201, 65535; | |
cvt.u64.u32 %rd160, %r7271; | |
bfe.u32 %r7272, %r2201, 16, 6; | |
mul.wide.u32 %rd2295, %r7271, 1792; | |
add.s64 %rd2296, %rd415, %rd2295; | |
mul.wide.u32 %rd2297, %r7272, 28; | |
add.s64 %rd2298, %rd2296, %rd2297; | |
ld.global.u32 %r7273, [%rd2298]; | |
and.b32 %r7274, %r7273, 65535; | |
bfe.u32 %r7275, %r7273, 16, 6; | |
mul.wide.u32 %rd2299, %r7274, 1792; | |
add.s64 %rd2300, %rd414, %rd2299; | |
mul.wide.u32 %rd2301, %r7275, 28; | |
add.s64 %rd2302, %rd2300, %rd2301; | |
ld.global.u32 %r7276, [%rd2302]; | |
and.b32 %r7277, %r7276, 65535; | |
shl.b32 %r7278, %r7277, 6; | |
bfe.u32 %r7279, %r7276, 16, 6; | |
or.b32 %r2202, %r7278, %r7279; | |
st.global.u32 [%rd153], %r2202; | |
bfe.u32 %r7280, %r7273, 22, 6; | |
mul.wide.u32 %rd2303, %r7280, 28; | |
add.s64 %rd2304, %rd2300, %rd2303; | |
ld.global.u32 %r7281, [%rd2304]; | |
and.b32 %r7282, %r7281, 65535; | |
shl.b32 %r7283, %r7282, 6; | |
bfe.u32 %r7284, %r7281, 16, 6; | |
or.b32 %r18040, %r7283, %r7284; | |
st.global.u32 [%rd153+4], %r18040; | |
setp.le.u32 %p275, %r2202, %r18040; | |
mov.u32 %r18039, %r2202; | |
@%p275 bra BB12_534; | |
st.global.u32 [%rd153], %r18040; | |
st.global.u32 [%rd153+4], %r2202; | |
mov.u32 %r17236, %r18040; | |
mov.u32 %r18040, %r2202; | |
mov.u32 %r18039, %r17236; | |
BB12_534: | |
mov.u32 %r18035, %r18039; | |
mov.u32 %r18036, %r18040; | |
bfe.u32 %r7285, %r2201, 22, 6; | |
mul.lo.s64 %rd2305, %rd160, 1792; | |
add.s64 %rd2306, %rd415, %rd2305; | |
mul.wide.u32 %rd2307, %r7285, 28; | |
add.s64 %rd2308, %rd2306, %rd2307; | |
ld.global.u32 %r7286, [%rd2308]; | |
and.b32 %r7287, %r7286, 65535; | |
bfe.u32 %r7288, %r7286, 16, 6; | |
mul.wide.u32 %rd2309, %r7287, 1792; | |
add.s64 %rd2310, %rd414, %rd2309; | |
mul.wide.u32 %rd2311, %r7288, 28; | |
add.s64 %rd2312, %rd2310, %rd2311; | |
ld.global.u32 %r7289, [%rd2312]; | |
and.b32 %r7290, %r7289, 65535; | |
shl.b32 %r7291, %r7290, 6; | |
bfe.u32 %r7292, %r7289, 16, 6; | |
or.b32 %r2206, %r7291, %r7292; | |
st.global.u32 [%rd153+8], %r2206; | |
bfe.u32 %r7293, %r7286, 22, 6; | |
mul.wide.u32 %rd2313, %r7293, 28; | |
add.s64 %rd2314, %rd2310, %rd2313; | |
ld.global.u32 %r7294, [%rd2314]; | |
and.b32 %r7295, %r7294, 65535; | |
shl.b32 %r7296, %r7295, 6; | |
bfe.u32 %r7297, %r7294, 16, 6; | |
or.b32 %r18042, %r7296, %r7297; | |
st.global.u32 [%rd153+12], %r18042; | |
setp.le.u32 %p276, %r2206, %r18042; | |
mov.u32 %r18041, %r2206; | |
@%p276 bra BB12_536; | |
st.global.u32 [%rd153+8], %r18042; | |
st.global.u32 [%rd153+12], %r2206; | |
mov.u32 %r17242, %r18042; | |
mov.u32 %r18042, %r2206; | |
mov.u32 %r18041, %r17242; | |
BB12_536: | |
mov.u32 %r2209, %r18041; | |
mov.u32 %r2208, %r18042; | |
setp.le.u32 %p277, %r18035, %r2209; | |
mov.u32 %r18037, %r2209; | |
mov.u32 %r18038, %r2208; | |
@%p277 bra BB12_538; | |
st.global.u32 [%rd153], %r2209; | |
st.global.u32 [%rd153+8], %r18035; | |
st.global.u32 [%rd153+4], %r2208; | |
st.global.u32 [%rd153+12], %r18036; | |
mov.u32 %r17239, %r18036; | |
mov.u32 %r17241, %r18035; | |
mov.u32 %r18036, %r2208; | |
mov.u32 %r18035, %r2209; | |
mov.u32 %r18037, %r17241; | |
mov.u32 %r18038, %r17239; | |
BB12_538: | |
mov.u32 %r18027, %r18035; | |
mov.u32 %r18028, %r18036; | |
mov.u32 %r18029, %r18037; | |
mov.u32 %r18030, %r18038; | |
mul.lo.s64 %rd2315, %rd159, 1792; | |
add.s64 %rd2316, %rd4, %rd2315; | |
bfe.u32 %r7298, %r2200, 22, 6; | |
mul.wide.u32 %rd2317, %r7298, 28; | |
add.s64 %rd2318, %rd2316, %rd2317; | |
ld.global.u32 %r2214, [%rd2318+-12]; | |
and.b32 %r7299, %r2214, 65535; | |
cvt.u64.u32 %rd161, %r7299; | |
bfe.u32 %r7300, %r2214, 16, 6; | |
mul.wide.u32 %rd2319, %r7299, 1792; | |
add.s64 %rd2320, %rd415, %rd2319; | |
mul.wide.u32 %rd2321, %r7300, 28; | |
add.s64 %rd2322, %rd2320, %rd2321; | |
ld.global.u32 %r7301, [%rd2322]; | |
and.b32 %r7302, %r7301, 65535; | |
bfe.u32 %r7303, %r7301, 16, 6; | |
mul.wide.u32 %rd2323, %r7302, 1792; | |
add.s64 %rd2324, %rd414, %rd2323; | |
mul.wide.u32 %rd2325, %r7303, 28; | |
add.s64 %rd2326, %rd2324, %rd2325; | |
ld.global.u32 %r7304, [%rd2326]; | |
and.b32 %r7305, %r7304, 65535; | |
shl.b32 %r7306, %r7305, 6; | |
bfe.u32 %r7307, %r7304, 16, 6; | |
or.b32 %r2215, %r7306, %r7307; | |
st.global.u32 [%rd153+16], %r2215; | |
bfe.u32 %r7308, %r7301, 22, 6; | |
mul.wide.u32 %rd2327, %r7308, 28; | |
add.s64 %rd2328, %rd2324, %rd2327; | |
ld.global.u32 %r7309, [%rd2328]; | |
and.b32 %r7310, %r7309, 65535; | |
shl.b32 %r7311, %r7310, 6; | |
bfe.u32 %r7312, %r7309, 16, 6; | |
or.b32 %r18048, %r7311, %r7312; | |
st.global.u32 [%rd153+20], %r18048; | |
setp.le.u32 %p278, %r2215, %r18048; | |
mov.u32 %r18047, %r2215; | |
@%p278 bra BB12_540; | |
st.global.u32 [%rd153+16], %r18048; | |
st.global.u32 [%rd153+20], %r2215; | |
mov.u32 %r17256, %r18048; | |
mov.u32 %r18048, %r2215; | |
mov.u32 %r18047, %r17256; | |
BB12_540: | |
mov.u32 %r18043, %r18047; | |
mov.u32 %r18044, %r18048; | |
bfe.u32 %r7313, %r2214, 22, 6; | |
mul.lo.s64 %rd2329, %rd161, 1792; | |
add.s64 %rd2330, %rd415, %rd2329; | |
mul.wide.u32 %rd2331, %r7313, 28; | |
add.s64 %rd2332, %rd2330, %rd2331; | |
ld.global.u32 %r7314, [%rd2332]; | |
and.b32 %r7315, %r7314, 65535; | |
bfe.u32 %r7316, %r7314, 16, 6; | |
mul.wide.u32 %rd2333, %r7315, 1792; | |
add.s64 %rd2334, %rd414, %rd2333; | |
mul.wide.u32 %rd2335, %r7316, 28; | |
add.s64 %rd2336, %rd2334, %rd2335; | |
ld.global.u32 %r7317, [%rd2336]; | |
and.b32 %r7318, %r7317, 65535; | |
shl.b32 %r7319, %r7318, 6; | |
bfe.u32 %r7320, %r7317, 16, 6; | |
or.b32 %r2219, %r7319, %r7320; | |
st.global.u32 [%rd153+24], %r2219; | |
bfe.u32 %r7321, %r7314, 22, 6; | |
mul.wide.u32 %rd2337, %r7321, 28; | |
add.s64 %rd2338, %rd2334, %rd2337; | |
ld.global.u32 %r7322, [%rd2338]; | |
and.b32 %r7323, %r7322, 65535; | |
shl.b32 %r7324, %r7323, 6; | |
bfe.u32 %r7325, %r7322, 16, 6; | |
or.b32 %r18050, %r7324, %r7325; | |
st.global.u32 [%rd153+28], %r18050; | |
setp.le.u32 %p279, %r2219, %r18050; | |
mov.u32 %r18049, %r2219; | |
@%p279 bra BB12_542; | |
st.global.u32 [%rd153+24], %r18050; | |
st.global.u32 [%rd153+28], %r2219; | |
mov.u32 %r17262, %r18050; | |
mov.u32 %r18050, %r2219; | |
mov.u32 %r18049, %r17262; | |
BB12_542: | |
mov.u32 %r2222, %r18049; | |
mov.u32 %r2221, %r18050; | |
setp.le.u32 %p280, %r18043, %r2222; | |
mov.u32 %r18045, %r2222; | |
mov.u32 %r18046, %r2221; | |
@%p280 bra BB12_544; | |
st.global.u32 [%rd153+16], %r2222; | |
st.global.u32 [%rd153+24], %r18043; | |
st.global.u32 [%rd153+20], %r2221; | |
st.global.u32 [%rd153+28], %r18044; | |
mov.u32 %r17259, %r18044; | |
mov.u32 %r17261, %r18043; | |
mov.u32 %r18044, %r2221; | |
mov.u32 %r18043, %r2222; | |
mov.u32 %r18045, %r17261; | |
mov.u32 %r18046, %r17259; | |
BB12_544: | |
mov.u32 %r2226, %r18043; | |
mov.u32 %r2225, %r18044; | |
mov.u32 %r2224, %r18045; | |
mov.u32 %r2223, %r18046; | |
setp.le.u32 %p281, %r18027, %r2226; | |
mov.u32 %r18031, %r2226; | |
mov.u32 %r18032, %r2225; | |
mov.u32 %r18033, %r2224; | |
mov.u32 %r18034, %r2223; | |
@%p281 bra BB12_546; | |
st.global.u32 [%rd153], %r2226; | |
st.global.u32 [%rd153+16], %r18027; | |
st.global.u32 [%rd153+4], %r2225; | |
st.global.u32 [%rd153+20], %r18028; | |
st.global.u32 [%rd153+8], %r2224; | |
st.global.u32 [%rd153+24], %r18029; | |
st.global.u32 [%rd153+12], %r2223; | |
st.global.u32 [%rd153+28], %r18030; | |
mov.u32 %r17249, %r18030; | |
mov.u32 %r17251, %r18029; | |
mov.u32 %r17253, %r18028; | |
mov.u32 %r17255, %r18027; | |
mov.u32 %r18030, %r2223; | |
mov.u32 %r18029, %r2224; | |
mov.u32 %r18028, %r2225; | |
mov.u32 %r18027, %r2226; | |
mov.u32 %r18031, %r17255; | |
mov.u32 %r18032, %r17253; | |
mov.u32 %r18033, %r17251; | |
mov.u32 %r18034, %r17249; | |
BB12_546: | |
mov.u32 %r18011, %r18027; | |
mov.u32 %r18012, %r18028; | |
mov.u32 %r18013, %r18029; | |
mov.u32 %r18014, %r18030; | |
mov.u32 %r18015, %r18031; | |
mov.u32 %r18016, %r18032; | |
mov.u32 %r18017, %r18033; | |
mov.u32 %r18018, %r18034; | |
mul.lo.s64 %rd2339, %rd158, 1792; | |
add.s64 %rd2340, %rd6, %rd2339; | |
bfe.u32 %r7326, %r2199, 22, 6; | |
mul.wide.u32 %rd2341, %r7326, 28; | |
add.s64 %rd2342, %rd2340, %rd2341; | |
ld.global.u32 %r2235, [%rd2342+-8]; | |
and.b32 %r7327, %r2235, 65535; | |
mul.wide.u32 %rd2343, %r7327, 1792; | |
add.s64 %rd2344, %rd4, %rd2343; | |
cvt.u64.u32 %rd162, %r7327; | |
bfe.u32 %r7328, %r2235, 16, 6; | |
mul.wide.u32 %rd2345, %r7328, 28; | |
add.s64 %rd2346, %rd2344, %rd2345; | |
ld.global.u32 %r2236, [%rd2346+-12]; | |
and.b32 %r7329, %r2236, 65535; | |
cvt.u64.u32 %rd163, %r7329; | |
bfe.u32 %r7330, %r2236, 16, 6; | |
mul.wide.u32 %rd2347, %r7329, 1792; | |
add.s64 %rd2348, %rd415, %rd2347; | |
mul.wide.u32 %rd2349, %r7330, 28; | |
add.s64 %rd2350, %rd2348, %rd2349; | |
ld.global.u32 %r7331, [%rd2350]; | |
and.b32 %r7332, %r7331, 65535; | |
bfe.u32 %r7333, %r7331, 16, 6; | |
mul.wide.u32 %rd2351, %r7332, 1792; | |
add.s64 %rd2352, %rd414, %rd2351; | |
mul.wide.u32 %rd2353, %r7333, 28; | |
add.s64 %rd2354, %rd2352, %rd2353; | |
ld.global.u32 %r7334, [%rd2354]; | |
and.b32 %r7335, %r7334, 65535; | |
shl.b32 %r7336, %r7335, 6; | |
bfe.u32 %r7337, %r7334, 16, 6; | |
or.b32 %r2237, %r7336, %r7337; | |
st.global.u32 [%rd153+32], %r2237; | |
bfe.u32 %r7338, %r7331, 22, 6; | |
mul.wide.u32 %rd2355, %r7338, 28; | |
add.s64 %rd2356, %rd2352, %rd2355; | |
ld.global.u32 %r7339, [%rd2356]; | |
and.b32 %r7340, %r7339, 65535; | |
shl.b32 %r7341, %r7340, 6; | |
bfe.u32 %r7342, %r7339, 16, 6; | |
or.b32 %r18064, %r7341, %r7342; | |
st.global.u32 [%rd153+36], %r18064; | |
setp.le.u32 %p282, %r2237, %r18064; | |
mov.u32 %r18063, %r2237; | |
@%p282 bra BB12_548; | |
st.global.u32 [%rd153+32], %r18064; | |
st.global.u32 [%rd153+36], %r2237; | |
mov.u32 %r17292, %r18064; | |
mov.u32 %r18064, %r2237; | |
mov.u32 %r18063, %r17292; | |
BB12_548: | |
mov.u32 %r18059, %r18063; | |
mov.u32 %r18060, %r18064; | |
bfe.u32 %r7343, %r2236, 22, 6; | |
mul.lo.s64 %rd2357, %rd163, 1792; | |
add.s64 %rd2358, %rd415, %rd2357; | |
mul.wide.u32 %rd2359, %r7343, 28; | |
add.s64 %rd2360, %rd2358, %rd2359; | |
ld.global.u32 %r7344, [%rd2360]; | |
and.b32 %r7345, %r7344, 65535; | |
bfe.u32 %r7346, %r7344, 16, 6; | |
mul.wide.u32 %rd2361, %r7345, 1792; | |
add.s64 %rd2362, %rd414, %rd2361; | |
mul.wide.u32 %rd2363, %r7346, 28; | |
add.s64 %rd2364, %rd2362, %rd2363; | |
ld.global.u32 %r7347, [%rd2364]; | |
and.b32 %r7348, %r7347, 65535; | |
shl.b32 %r7349, %r7348, 6; | |
bfe.u32 %r7350, %r7347, 16, 6; | |
or.b32 %r2241, %r7349, %r7350; | |
st.global.u32 [%rd153+40], %r2241; | |
bfe.u32 %r7351, %r7344, 22, 6; | |
mul.wide.u32 %rd2365, %r7351, 28; | |
add.s64 %rd2366, %rd2362, %rd2365; | |
ld.global.u32 %r7352, [%rd2366]; | |
and.b32 %r7353, %r7352, 65535; | |
shl.b32 %r7354, %r7353, 6; | |
bfe.u32 %r7355, %r7352, 16, 6; | |
or.b32 %r18066, %r7354, %r7355; | |
st.global.u32 [%rd153+44], %r18066; | |
setp.le.u32 %p283, %r2241, %r18066; | |
mov.u32 %r18065, %r2241; | |
@%p283 bra BB12_550; | |
st.global.u32 [%rd153+40], %r18066; | |
st.global.u32 [%rd153+44], %r2241; | |
mov.u32 %r17298, %r18066; | |
mov.u32 %r18066, %r2241; | |
mov.u32 %r18065, %r17298; | |
BB12_550: | |
mov.u32 %r2244, %r18065; | |
mov.u32 %r2243, %r18066; | |
setp.le.u32 %p284, %r18059, %r2244; | |
mov.u32 %r18061, %r2244; | |
mov.u32 %r18062, %r2243; | |
@%p284 bra BB12_552; | |
st.global.u32 [%rd153+32], %r2244; | |
st.global.u32 [%rd153+40], %r18059; | |
st.global.u32 [%rd153+36], %r2243; | |
st.global.u32 [%rd153+44], %r18060; | |
mov.u32 %r17295, %r18060; | |
mov.u32 %r17297, %r18059; | |
mov.u32 %r18060, %r2243; | |
mov.u32 %r18059, %r2244; | |
mov.u32 %r18061, %r17297; | |
mov.u32 %r18062, %r17295; | |
BB12_552: | |
mov.u32 %r18051, %r18059; | |
mov.u32 %r18052, %r18060; | |
mov.u32 %r18053, %r18061; | |
mov.u32 %r18054, %r18062; | |
mul.lo.s64 %rd2367, %rd162, 1792; | |
add.s64 %rd2368, %rd4, %rd2367; | |
bfe.u32 %r7356, %r2235, 22, 6; | |
mul.wide.u32 %rd2369, %r7356, 28; | |
add.s64 %rd2370, %rd2368, %rd2369; | |
ld.global.u32 %r2249, [%rd2370+-12]; | |
and.b32 %r7357, %r2249, 65535; | |
cvt.u64.u32 %rd164, %r7357; | |
bfe.u32 %r7358, %r2249, 16, 6; | |
mul.wide.u32 %rd2371, %r7357, 1792; | |
add.s64 %rd2372, %rd415, %rd2371; | |
mul.wide.u32 %rd2373, %r7358, 28; | |
add.s64 %rd2374, %rd2372, %rd2373; | |
ld.global.u32 %r7359, [%rd2374]; | |
and.b32 %r7360, %r7359, 65535; | |
bfe.u32 %r7361, %r7359, 16, 6; | |
mul.wide.u32 %rd2375, %r7360, 1792; | |
add.s64 %rd2376, %rd414, %rd2375; | |
mul.wide.u32 %rd2377, %r7361, 28; | |
add.s64 %rd2378, %rd2376, %rd2377; | |
ld.global.u32 %r7362, [%rd2378]; | |
and.b32 %r7363, %r7362, 65535; | |
shl.b32 %r7364, %r7363, 6; | |
bfe.u32 %r7365, %r7362, 16, 6; | |
or.b32 %r2250, %r7364, %r7365; | |
st.global.u32 [%rd153+48], %r2250; | |
bfe.u32 %r7366, %r7359, 22, 6; | |
mul.wide.u32 %rd2379, %r7366, 28; | |
add.s64 %rd2380, %rd2376, %rd2379; | |
ld.global.u32 %r7367, [%rd2380]; | |
and.b32 %r7368, %r7367, 65535; | |
shl.b32 %r7369, %r7368, 6; | |
bfe.u32 %r7370, %r7367, 16, 6; | |
or.b32 %r18072, %r7369, %r7370; | |
st.global.u32 [%rd153+52], %r18072; | |
setp.le.u32 %p285, %r2250, %r18072; | |
mov.u32 %r18071, %r2250; | |
@%p285 bra BB12_554; | |
st.global.u32 [%rd153+48], %r18072; | |
st.global.u32 [%rd153+52], %r2250; | |
mov.u32 %r17312, %r18072; | |
mov.u32 %r18072, %r2250; | |
mov.u32 %r18071, %r17312; | |
BB12_554: | |
mov.u32 %r18067, %r18071; | |
mov.u32 %r18068, %r18072; | |
bfe.u32 %r7371, %r2249, 22, 6; | |
mul.lo.s64 %rd2381, %rd164, 1792; | |
add.s64 %rd2382, %rd415, %rd2381; | |
mul.wide.u32 %rd2383, %r7371, 28; | |
add.s64 %rd2384, %rd2382, %rd2383; | |
ld.global.u32 %r7372, [%rd2384]; | |
and.b32 %r7373, %r7372, 65535; | |
bfe.u32 %r7374, %r7372, 16, 6; | |
mul.wide.u32 %rd2385, %r7373, 1792; | |
add.s64 %rd2386, %rd414, %rd2385; | |
mul.wide.u32 %rd2387, %r7374, 28; | |
add.s64 %rd2388, %rd2386, %rd2387; | |
ld.global.u32 %r7375, [%rd2388]; | |
and.b32 %r7376, %r7375, 65535; | |
shl.b32 %r7377, %r7376, 6; | |
bfe.u32 %r7378, %r7375, 16, 6; | |
or.b32 %r2254, %r7377, %r7378; | |
st.global.u32 [%rd153+56], %r2254; | |
bfe.u32 %r7379, %r7372, 22, 6; | |
mul.wide.u32 %rd2389, %r7379, 28; | |
add.s64 %rd2390, %rd2386, %rd2389; | |
ld.global.u32 %r7380, [%rd2390]; | |
and.b32 %r7381, %r7380, 65535; | |
shl.b32 %r7382, %r7381, 6; | |
bfe.u32 %r7383, %r7380, 16, 6; | |
or.b32 %r18074, %r7382, %r7383; | |
st.global.u32 [%rd153+60], %r18074; | |
setp.le.u32 %p286, %r2254, %r18074; | |
mov.u32 %r18073, %r2254; | |
@%p286 bra BB12_556; | |
st.global.u32 [%rd153+56], %r18074; | |
st.global.u32 [%rd153+60], %r2254; | |
mov.u32 %r17318, %r18074; | |
mov.u32 %r18074, %r2254; | |
mov.u32 %r18073, %r17318; | |
BB12_556: | |
mov.u32 %r2257, %r18073; | |
mov.u32 %r2256, %r18074; | |
setp.le.u32 %p287, %r18067, %r2257; | |
mov.u32 %r18069, %r2257; | |
mov.u32 %r18070, %r2256; | |
@%p287 bra BB12_558; | |
st.global.u32 [%rd153+48], %r2257; | |
st.global.u32 [%rd153+56], %r18067; | |
st.global.u32 [%rd153+52], %r2256; | |
st.global.u32 [%rd153+60], %r18068; | |
mov.u32 %r17315, %r18068; | |
mov.u32 %r17317, %r18067; | |
mov.u32 %r18068, %r2256; | |
mov.u32 %r18067, %r2257; | |
mov.u32 %r18069, %r17317; | |
mov.u32 %r18070, %r17315; | |
BB12_558: | |
mov.u32 %r2261, %r18067; | |
mov.u32 %r2260, %r18068; | |
mov.u32 %r2259, %r18069; | |
mov.u32 %r2258, %r18070; | |
setp.le.u32 %p288, %r18051, %r2261; | |
mov.u32 %r18055, %r2261; | |
mov.u32 %r18056, %r2260; | |
mov.u32 %r18057, %r2259; | |
mov.u32 %r18058, %r2258; | |
@%p288 bra BB12_560; | |
st.global.u32 [%rd153+32], %r2261; | |
st.global.u32 [%rd153+48], %r18051; | |
st.global.u32 [%rd153+36], %r2260; | |
st.global.u32 [%rd153+52], %r18052; | |
st.global.u32 [%rd153+40], %r2259; | |
st.global.u32 [%rd153+56], %r18053; | |
st.global.u32 [%rd153+44], %r2258; | |
st.global.u32 [%rd153+60], %r18054; | |
mov.u32 %r17305, %r18054; | |
mov.u32 %r17307, %r18053; | |
mov.u32 %r17309, %r18052; | |
mov.u32 %r17311, %r18051; | |
mov.u32 %r18054, %r2258; | |
mov.u32 %r18053, %r2259; | |
mov.u32 %r18052, %r2260; | |
mov.u32 %r18051, %r2261; | |
mov.u32 %r18055, %r17311; | |
mov.u32 %r18056, %r17309; | |
mov.u32 %r18057, %r17307; | |
mov.u32 %r18058, %r17305; | |
BB12_560: | |
mov.u32 %r2269, %r18051; | |
mov.u32 %r2268, %r18052; | |
mov.u32 %r2267, %r18053; | |
mov.u32 %r2266, %r18054; | |
mov.u32 %r2265, %r18055; | |
mov.u32 %r2264, %r18056; | |
mov.u32 %r2263, %r18057; | |
mov.u32 %r2262, %r18058; | |
setp.le.u32 %p289, %r18011, %r2269; | |
mov.u32 %r18019, %r2269; | |
mov.u32 %r18020, %r2268; | |
mov.u32 %r18021, %r2267; | |
mov.u32 %r18022, %r2266; | |
mov.u32 %r18023, %r2265; | |
mov.u32 %r18024, %r2264; | |
mov.u32 %r18025, %r2263; | |
mov.u32 %r18026, %r2262; | |
@%p289 bra BB12_562; | |
st.global.u32 [%rd153], %r2269; | |
st.global.u32 [%rd153+32], %r18011; | |
st.global.u32 [%rd153+4], %r2268; | |
st.global.u32 [%rd153+36], %r18012; | |
st.global.u32 [%rd153+8], %r2267; | |
st.global.u32 [%rd153+40], %r18013; | |
st.global.u32 [%rd153+12], %r2266; | |
st.global.u32 [%rd153+44], %r18014; | |
st.global.u32 [%rd153+16], %r2265; | |
st.global.u32 [%rd153+48], %r18015; | |
st.global.u32 [%rd153+20], %r2264; | |
st.global.u32 [%rd153+52], %r18016; | |
st.global.u32 [%rd153+24], %r2263; | |
st.global.u32 [%rd153+56], %r18017; | |
st.global.u32 [%rd153+28], %r2262; | |
st.global.u32 [%rd153+60], %r18018; | |
mov.u32 %r17277, %r18018; | |
mov.u32 %r17279, %r18017; | |
mov.u32 %r17281, %r18016; | |
mov.u32 %r17283, %r18015; | |
mov.u32 %r17285, %r18014; | |
mov.u32 %r17287, %r18013; | |
mov.u32 %r17289, %r18012; | |
mov.u32 %r17291, %r18011; | |
mov.u32 %r18018, %r2262; | |
mov.u32 %r18017, %r2263; | |
mov.u32 %r18016, %r2264; | |
mov.u32 %r18015, %r2265; | |
mov.u32 %r18014, %r2266; | |
mov.u32 %r18013, %r2267; | |
mov.u32 %r18012, %r2268; | |
mov.u32 %r18011, %r2269; | |
mov.u32 %r18019, %r17291; | |
mov.u32 %r18020, %r17289; | |
mov.u32 %r18021, %r17287; | |
mov.u32 %r18022, %r17285; | |
mov.u32 %r18023, %r17283; | |
mov.u32 %r18024, %r17281; | |
mov.u32 %r18025, %r17279; | |
mov.u32 %r18026, %r17277; | |
BB12_562: | |
mov.u32 %r17979, %r18011; | |
mov.u32 %r17980, %r18012; | |
mov.u32 %r17981, %r18013; | |
mov.u32 %r17982, %r18014; | |
mov.u32 %r17983, %r18015; | |
mov.u32 %r17984, %r18016; | |
mov.u32 %r17985, %r18017; | |
mov.u32 %r17986, %r18018; | |
mov.u32 %r17987, %r18019; | |
mov.u32 %r17988, %r18020; | |
mov.u32 %r17989, %r18021; | |
mov.u32 %r17990, %r18022; | |
mov.u32 %r17991, %r18023; | |
mov.u32 %r17992, %r18024; | |
mov.u32 %r17993, %r18025; | |
mov.u32 %r17994, %r18026; | |
mul.lo.s64 %rd2391, %rd157, 1792; | |
add.s64 %rd2392, %rd4, %rd2391; | |
bfe.u32 %r7384, %r2198, 22, 6; | |
mul.wide.u32 %rd2393, %r7384, 28; | |
add.s64 %rd2394, %rd2392, %rd2393; | |
ld.global.u32 %r2286, [%rd2394+-8]; | |
and.b32 %r7385, %r2286, 65535; | |
mul.wide.u32 %rd2395, %r7385, 1792; | |
add.s64 %rd2396, %rd6, %rd2395; | |
bfe.u32 %r7386, %r2286, 16, 6; | |
mul.wide.u32 %rd2397, %r7386, 28; | |
add.s64 %rd2398, %rd2396, %rd2397; | |
ld.global.u32 %r2287, [%rd2398+-8]; | |
and.b32 %r7387, %r2287, 65535; | |
mul.wide.u32 %rd2399, %r7387, 1792; | |
add.s64 %rd2400, %rd4, %rd2399; | |
cvt.u64.u32 %rd165, %r7385; | |
cvt.u64.u32 %rd166, %r7387; | |
bfe.u32 %r7388, %r2287, 16, 6; | |
mul.wide.u32 %rd2401, %r7388, 28; | |
add.s64 %rd2402, %rd2400, %rd2401; | |
ld.global.u32 %r2288, [%rd2402+-12]; | |
and.b32 %r7389, %r2288, 65535; | |
cvt.u64.u32 %rd167, %r7389; | |
bfe.u32 %r7390, %r2288, 16, 6; | |
mul.wide.u32 %rd2403, %r7389, 1792; | |
add.s64 %rd2404, %rd415, %rd2403; | |
mul.wide.u32 %rd2405, %r7390, 28; | |
add.s64 %rd2406, %rd2404, %rd2405; | |
ld.global.u32 %r7391, [%rd2406]; | |
and.b32 %r7392, %r7391, 65535; | |
bfe.u32 %r7393, %r7391, 16, 6; | |
mul.wide.u32 %rd2407, %r7392, 1792; | |
add.s64 %rd2408, %rd414, %rd2407; | |
mul.wide.u32 %rd2409, %r7393, 28; | |
add.s64 %rd2410, %rd2408, %rd2409; | |
ld.global.u32 %r7394, [%rd2410]; | |
and.b32 %r7395, %r7394, 65535; | |
shl.b32 %r7396, %r7395, 6; | |
bfe.u32 %r7397, %r7394, 16, 6; | |
or.b32 %r2289, %r7396, %r7397; | |
st.global.u32 [%rd153+64], %r2289; | |
bfe.u32 %r7398, %r7391, 22, 6; | |
mul.wide.u32 %rd2411, %r7398, 28; | |
add.s64 %rd2412, %rd2408, %rd2411; | |
ld.global.u32 %r7399, [%rd2412]; | |
and.b32 %r7400, %r7399, 65535; | |
shl.b32 %r7401, %r7400, 6; | |
bfe.u32 %r7402, %r7399, 16, 6; | |
or.b32 %r18104, %r7401, %r7402; | |
st.global.u32 [%rd153+68], %r18104; | |
setp.le.u32 %p290, %r2289, %r18104; | |
mov.u32 %r18103, %r2289; | |
@%p290 bra BB12_564; | |
st.global.u32 [%rd153+64], %r18104; | |
st.global.u32 [%rd153+68], %r2289; | |
mov.u32 %r17380, %r18104; | |
mov.u32 %r18104, %r2289; | |
mov.u32 %r18103, %r17380; | |
BB12_564: | |
mov.u32 %r18099, %r18103; | |
mov.u32 %r18100, %r18104; | |
bfe.u32 %r7403, %r2288, 22, 6; | |
mul.lo.s64 %rd2413, %rd167, 1792; | |
add.s64 %rd2414, %rd415, %rd2413; | |
mul.wide.u32 %rd2415, %r7403, 28; | |
add.s64 %rd2416, %rd2414, %rd2415; | |
ld.global.u32 %r7404, [%rd2416]; | |
and.b32 %r7405, %r7404, 65535; | |
bfe.u32 %r7406, %r7404, 16, 6; | |
mul.wide.u32 %rd2417, %r7405, 1792; | |
add.s64 %rd2418, %rd414, %rd2417; | |
mul.wide.u32 %rd2419, %r7406, 28; | |
add.s64 %rd2420, %rd2418, %rd2419; | |
ld.global.u32 %r7407, [%rd2420]; | |
and.b32 %r7408, %r7407, 65535; | |
shl.b32 %r7409, %r7408, 6; | |
bfe.u32 %r7410, %r7407, 16, 6; | |
or.b32 %r2293, %r7409, %r7410; | |
st.global.u32 [%rd153+72], %r2293; | |
bfe.u32 %r7411, %r7404, 22, 6; | |
mul.wide.u32 %rd2421, %r7411, 28; | |
add.s64 %rd2422, %rd2418, %rd2421; | |
ld.global.u32 %r7412, [%rd2422]; | |
and.b32 %r7413, %r7412, 65535; | |
shl.b32 %r7414, %r7413, 6; | |
bfe.u32 %r7415, %r7412, 16, 6; | |
or.b32 %r18106, %r7414, %r7415; | |
st.global.u32 [%rd153+76], %r18106; | |
setp.le.u32 %p291, %r2293, %r18106; | |
mov.u32 %r18105, %r2293; | |
@%p291 bra BB12_566; | |
st.global.u32 [%rd153+72], %r18106; | |
st.global.u32 [%rd153+76], %r2293; | |
mov.u32 %r17386, %r18106; | |
mov.u32 %r18106, %r2293; | |
mov.u32 %r18105, %r17386; | |
BB12_566: | |
mov.u32 %r2296, %r18105; | |
mov.u32 %r2295, %r18106; | |
setp.le.u32 %p292, %r18099, %r2296; | |
mov.u32 %r18101, %r2296; | |
mov.u32 %r18102, %r2295; | |
@%p292 bra BB12_568; | |
st.global.u32 [%rd153+64], %r2296; | |
st.global.u32 [%rd153+72], %r18099; | |
st.global.u32 [%rd153+68], %r2295; | |
st.global.u32 [%rd153+76], %r18100; | |
mov.u32 %r17383, %r18100; | |
mov.u32 %r17385, %r18099; | |
mov.u32 %r18100, %r2295; | |
mov.u32 %r18099, %r2296; | |
mov.u32 %r18101, %r17385; | |
mov.u32 %r18102, %r17383; | |
BB12_568: | |
mov.u32 %r18091, %r18099; | |
mov.u32 %r18092, %r18100; | |
mov.u32 %r18093, %r18101; | |
mov.u32 %r18094, %r18102; | |
mul.lo.s64 %rd2423, %rd166, 1792; | |
add.s64 %rd2424, %rd4, %rd2423; | |
bfe.u32 %r7416, %r2287, 22, 6; | |
mul.wide.u32 %rd2425, %r7416, 28; | |
add.s64 %rd2426, %rd2424, %rd2425; | |
ld.global.u32 %r2301, [%rd2426+-12]; | |
and.b32 %r7417, %r2301, 65535; | |
cvt.u64.u32 %rd168, %r7417; | |
bfe.u32 %r7418, %r2301, 16, 6; | |
mul.wide.u32 %rd2427, %r7417, 1792; | |
add.s64 %rd2428, %rd415, %rd2427; | |
mul.wide.u32 %rd2429, %r7418, 28; | |
add.s64 %rd2430, %rd2428, %rd2429; | |
ld.global.u32 %r7419, [%rd2430]; | |
and.b32 %r7420, %r7419, 65535; | |
bfe.u32 %r7421, %r7419, 16, 6; | |
mul.wide.u32 %rd2431, %r7420, 1792; | |
add.s64 %rd2432, %rd414, %rd2431; | |
mul.wide.u32 %rd2433, %r7421, 28; | |
add.s64 %rd2434, %rd2432, %rd2433; | |
ld.global.u32 %r7422, [%rd2434]; | |
and.b32 %r7423, %r7422, 65535; | |
shl.b32 %r7424, %r7423, 6; | |
bfe.u32 %r7425, %r7422, 16, 6; | |
or.b32 %r2302, %r7424, %r7425; | |
st.global.u32 [%rd153+80], %r2302; | |
bfe.u32 %r7426, %r7419, 22, 6; | |
mul.wide.u32 %rd2435, %r7426, 28; | |
add.s64 %rd2436, %rd2432, %rd2435; | |
ld.global.u32 %r7427, [%rd2436]; | |
and.b32 %r7428, %r7427, 65535; | |
shl.b32 %r7429, %r7428, 6; | |
bfe.u32 %r7430, %r7427, 16, 6; | |
or.b32 %r18112, %r7429, %r7430; | |
st.global.u32 [%rd153+84], %r18112; | |
setp.le.u32 %p293, %r2302, %r18112; | |
mov.u32 %r18111, %r2302; | |
@%p293 bra BB12_570; | |
st.global.u32 [%rd153+80], %r18112; | |
st.global.u32 [%rd153+84], %r2302; | |
mov.u32 %r17400, %r18112; | |
mov.u32 %r18112, %r2302; | |
mov.u32 %r18111, %r17400; | |
BB12_570: | |
mov.u32 %r18107, %r18111; | |
mov.u32 %r18108, %r18112; | |
bfe.u32 %r7431, %r2301, 22, 6; | |
mul.lo.s64 %rd2437, %rd168, 1792; | |
add.s64 %rd2438, %rd415, %rd2437; | |
mul.wide.u32 %rd2439, %r7431, 28; | |
add.s64 %rd2440, %rd2438, %rd2439; | |
ld.global.u32 %r7432, [%rd2440]; | |
and.b32 %r7433, %r7432, 65535; | |
bfe.u32 %r7434, %r7432, 16, 6; | |
mul.wide.u32 %rd2441, %r7433, 1792; | |
add.s64 %rd2442, %rd414, %rd2441; | |
mul.wide.u32 %rd2443, %r7434, 28; | |
add.s64 %rd2444, %rd2442, %rd2443; | |
ld.global.u32 %r7435, [%rd2444]; | |
and.b32 %r7436, %r7435, 65535; | |
shl.b32 %r7437, %r7436, 6; | |
bfe.u32 %r7438, %r7435, 16, 6; | |
or.b32 %r2306, %r7437, %r7438; | |
st.global.u32 [%rd153+88], %r2306; | |
bfe.u32 %r7439, %r7432, 22, 6; | |
mul.wide.u32 %rd2445, %r7439, 28; | |
add.s64 %rd2446, %rd2442, %rd2445; | |
ld.global.u32 %r7440, [%rd2446]; | |
and.b32 %r7441, %r7440, 65535; | |
shl.b32 %r7442, %r7441, 6; | |
bfe.u32 %r7443, %r7440, 16, 6; | |
or.b32 %r18114, %r7442, %r7443; | |
st.global.u32 [%rd153+92], %r18114; | |
setp.le.u32 %p294, %r2306, %r18114; | |
mov.u32 %r18113, %r2306; | |
@%p294 bra BB12_572; | |
st.global.u32 [%rd153+88], %r18114; | |
st.global.u32 [%rd153+92], %r2306; | |
mov.u32 %r17406, %r18114; | |
mov.u32 %r18114, %r2306; | |
mov.u32 %r18113, %r17406; | |
BB12_572: | |
mov.u32 %r2309, %r18113; | |
mov.u32 %r2308, %r18114; | |
setp.le.u32 %p295, %r18107, %r2309; | |
mov.u32 %r18109, %r2309; | |
mov.u32 %r18110, %r2308; | |
@%p295 bra BB12_574; | |
st.global.u32 [%rd153+80], %r2309; | |
st.global.u32 [%rd153+88], %r18107; | |
st.global.u32 [%rd153+84], %r2308; | |
st.global.u32 [%rd153+92], %r18108; | |
mov.u32 %r17403, %r18108; | |
mov.u32 %r17405, %r18107; | |
mov.u32 %r18108, %r2308; | |
mov.u32 %r18107, %r2309; | |
mov.u32 %r18109, %r17405; | |
mov.u32 %r18110, %r17403; | |
BB12_574: | |
mov.u32 %r2313, %r18107; | |
mov.u32 %r2312, %r18108; | |
mov.u32 %r2311, %r18109; | |
mov.u32 %r2310, %r18110; | |
setp.le.u32 %p296, %r18091, %r2313; | |
mov.u32 %r18095, %r2313; | |
mov.u32 %r18096, %r2312; | |
mov.u32 %r18097, %r2311; | |
mov.u32 %r18098, %r2310; | |
@%p296 bra BB12_576; | |
st.global.u32 [%rd153+64], %r2313; | |
st.global.u32 [%rd153+80], %r18091; | |
st.global.u32 [%rd153+68], %r2312; | |
st.global.u32 [%rd153+84], %r18092; | |
st.global.u32 [%rd153+72], %r2311; | |
st.global.u32 [%rd153+88], %r18093; | |
st.global.u32 [%rd153+76], %r2310; | |
st.global.u32 [%rd153+92], %r18094; | |
mov.u32 %r17393, %r18094; | |
mov.u32 %r17395, %r18093; | |
mov.u32 %r17397, %r18092; | |
mov.u32 %r17399, %r18091; | |
mov.u32 %r18094, %r2310; | |
mov.u32 %r18093, %r2311; | |
mov.u32 %r18092, %r2312; | |
mov.u32 %r18091, %r2313; | |
mov.u32 %r18095, %r17399; | |
mov.u32 %r18096, %r17397; | |
mov.u32 %r18097, %r17395; | |
mov.u32 %r18098, %r17393; | |
BB12_576: | |
mov.u32 %r18075, %r18091; | |
mov.u32 %r18076, %r18092; | |
mov.u32 %r18077, %r18093; | |
mov.u32 %r18078, %r18094; | |
mov.u32 %r18079, %r18095; | |
mov.u32 %r18080, %r18096; | |
mov.u32 %r18081, %r18097; | |
mov.u32 %r18082, %r18098; | |
mul.lo.s64 %rd2447, %rd165, 1792; | |
add.s64 %rd2448, %rd6, %rd2447; | |
bfe.u32 %r7444, %r2286, 22, 6; | |
mul.wide.u32 %rd2449, %r7444, 28; | |
add.s64 %rd2450, %rd2448, %rd2449; | |
ld.global.u32 %r2322, [%rd2450+-8]; | |
and.b32 %r7445, %r2322, 65535; | |
mul.wide.u32 %rd2451, %r7445, 1792; | |
add.s64 %rd2452, %rd4, %rd2451; | |
cvt.u64.u32 %rd169, %r7445; | |
bfe.u32 %r7446, %r2322, 16, 6; | |
mul.wide.u32 %rd2453, %r7446, 28; | |
add.s64 %rd2454, %rd2452, %rd2453; | |
ld.global.u32 %r2323, [%rd2454+-12]; | |
and.b32 %r7447, %r2323, 65535; | |
cvt.u64.u32 %rd170, %r7447; | |
bfe.u32 %r7448, %r2323, 16, 6; | |
mul.wide.u32 %rd2455, %r7447, 1792; | |
add.s64 %rd2456, %rd415, %rd2455; | |
mul.wide.u32 %rd2457, %r7448, 28; | |
add.s64 %rd2458, %rd2456, %rd2457; | |
ld.global.u32 %r7449, [%rd2458]; | |
and.b32 %r7450, %r7449, 65535; | |
bfe.u32 %r7451, %r7449, 16, 6; | |
mul.wide.u32 %rd2459, %r7450, 1792; | |
add.s64 %rd2460, %rd414, %rd2459; | |
mul.wide.u32 %rd2461, %r7451, 28; | |
add.s64 %rd2462, %rd2460, %rd2461; | |
ld.global.u32 %r7452, [%rd2462]; | |
and.b32 %r7453, %r7452, 65535; | |
shl.b32 %r7454, %r7453, 6; | |
bfe.u32 %r7455, %r7452, 16, 6; | |
or.b32 %r2324, %r7454, %r7455; | |
st.global.u32 [%rd153+96], %r2324; | |
bfe.u32 %r7456, %r7449, 22, 6; | |
mul.wide.u32 %rd2463, %r7456, 28; | |
add.s64 %rd2464, %rd2460, %rd2463; | |
ld.global.u32 %r7457, [%rd2464]; | |
and.b32 %r7458, %r7457, 65535; | |
shl.b32 %r7459, %r7458, 6; | |
bfe.u32 %r7460, %r7457, 16, 6; | |
or.b32 %r18128, %r7459, %r7460; | |
st.global.u32 [%rd153+100], %r18128; | |
setp.le.u32 %p297, %r2324, %r18128; | |
mov.u32 %r18127, %r2324; | |
@%p297 bra BB12_578; | |
st.global.u32 [%rd153+96], %r18128; | |
st.global.u32 [%rd153+100], %r2324; | |
mov.u32 %r17436, %r18128; | |
mov.u32 %r18128, %r2324; | |
mov.u32 %r18127, %r17436; | |
BB12_578: | |
mov.u32 %r18123, %r18127; | |
mov.u32 %r18124, %r18128; | |
bfe.u32 %r7461, %r2323, 22, 6; | |
mul.lo.s64 %rd2465, %rd170, 1792; | |
add.s64 %rd2466, %rd415, %rd2465; | |
mul.wide.u32 %rd2467, %r7461, 28; | |
add.s64 %rd2468, %rd2466, %rd2467; | |
ld.global.u32 %r7462, [%rd2468]; | |
and.b32 %r7463, %r7462, 65535; | |
bfe.u32 %r7464, %r7462, 16, 6; | |
mul.wide.u32 %rd2469, %r7463, 1792; | |
add.s64 %rd2470, %rd414, %rd2469; | |
mul.wide.u32 %rd2471, %r7464, 28; | |
add.s64 %rd2472, %rd2470, %rd2471; | |
ld.global.u32 %r7465, [%rd2472]; | |
and.b32 %r7466, %r7465, 65535; | |
shl.b32 %r7467, %r7466, 6; | |
bfe.u32 %r7468, %r7465, 16, 6; | |
or.b32 %r2328, %r7467, %r7468; | |
st.global.u32 [%rd153+104], %r2328; | |
bfe.u32 %r7469, %r7462, 22, 6; | |
mul.wide.u32 %rd2473, %r7469, 28; | |
add.s64 %rd2474, %rd2470, %rd2473; | |
ld.global.u32 %r7470, [%rd2474]; | |
and.b32 %r7471, %r7470, 65535; | |
shl.b32 %r7472, %r7471, 6; | |
bfe.u32 %r7473, %r7470, 16, 6; | |
or.b32 %r18130, %r7472, %r7473; | |
st.global.u32 [%rd153+108], %r18130; | |
setp.le.u32 %p298, %r2328, %r18130; | |
mov.u32 %r18129, %r2328; | |
@%p298 bra BB12_580; | |
st.global.u32 [%rd153+104], %r18130; | |
st.global.u32 [%rd153+108], %r2328; | |
mov.u32 %r17442, %r18130; | |
mov.u32 %r18130, %r2328; | |
mov.u32 %r18129, %r17442; | |
BB12_580: | |
mov.u32 %r2331, %r18129; | |
mov.u32 %r2330, %r18130; | |
setp.le.u32 %p299, %r18123, %r2331; | |
mov.u32 %r18125, %r2331; | |
mov.u32 %r18126, %r2330; | |
@%p299 bra BB12_582; | |
st.global.u32 [%rd153+96], %r2331; | |
st.global.u32 [%rd153+104], %r18123; | |
st.global.u32 [%rd153+100], %r2330; | |
st.global.u32 [%rd153+108], %r18124; | |
mov.u32 %r17439, %r18124; | |
mov.u32 %r17441, %r18123; | |
mov.u32 %r18124, %r2330; | |
mov.u32 %r18123, %r2331; | |
mov.u32 %r18125, %r17441; | |
mov.u32 %r18126, %r17439; | |
BB12_582: | |
mov.u32 %r18115, %r18123; | |
mov.u32 %r18116, %r18124; | |
mov.u32 %r18117, %r18125; | |
mov.u32 %r18118, %r18126; | |
mul.lo.s64 %rd2475, %rd169, 1792; | |
add.s64 %rd2476, %rd4, %rd2475; | |
bfe.u32 %r7474, %r2322, 22, 6; | |
mul.wide.u32 %rd2477, %r7474, 28; | |
add.s64 %rd2478, %rd2476, %rd2477; | |
ld.global.u32 %r2336, [%rd2478+-12]; | |
and.b32 %r7475, %r2336, 65535; | |
cvt.u64.u32 %rd171, %r7475; | |
bfe.u32 %r7476, %r2336, 16, 6; | |
mul.wide.u32 %rd2479, %r7475, 1792; | |
add.s64 %rd2480, %rd415, %rd2479; | |
mul.wide.u32 %rd2481, %r7476, 28; | |
add.s64 %rd2482, %rd2480, %rd2481; | |
ld.global.u32 %r7477, [%rd2482]; | |
and.b32 %r7478, %r7477, 65535; | |
bfe.u32 %r7479, %r7477, 16, 6; | |
mul.wide.u32 %rd2483, %r7478, 1792; | |
add.s64 %rd2484, %rd414, %rd2483; | |
mul.wide.u32 %rd2485, %r7479, 28; | |
add.s64 %rd2486, %rd2484, %rd2485; | |
ld.global.u32 %r7480, [%rd2486]; | |
and.b32 %r7481, %r7480, 65535; | |
shl.b32 %r7482, %r7481, 6; | |
bfe.u32 %r7483, %r7480, 16, 6; | |
or.b32 %r2337, %r7482, %r7483; | |
st.global.u32 [%rd153+112], %r2337; | |
bfe.u32 %r7484, %r7477, 22, 6; | |
mul.wide.u32 %rd2487, %r7484, 28; | |
add.s64 %rd2488, %rd2484, %rd2487; | |
ld.global.u32 %r7485, [%rd2488]; | |
and.b32 %r7486, %r7485, 65535; | |
shl.b32 %r7487, %r7486, 6; | |
bfe.u32 %r7488, %r7485, 16, 6; | |
or.b32 %r18136, %r7487, %r7488; | |
st.global.u32 [%rd153+116], %r18136; | |
setp.le.u32 %p300, %r2337, %r18136; | |
mov.u32 %r18135, %r2337; | |
@%p300 bra BB12_584; | |
st.global.u32 [%rd153+112], %r18136; | |
st.global.u32 [%rd153+116], %r2337; | |
mov.u32 %r17456, %r18136; | |
mov.u32 %r18136, %r2337; | |
mov.u32 %r18135, %r17456; | |
BB12_584: | |
mov.u32 %r18131, %r18135; | |
mov.u32 %r18132, %r18136; | |
bfe.u32 %r7489, %r2336, 22, 6; | |
mul.lo.s64 %rd2489, %rd171, 1792; | |
add.s64 %rd2490, %rd415, %rd2489; | |
mul.wide.u32 %rd2491, %r7489, 28; | |
add.s64 %rd2492, %rd2490, %rd2491; | |
ld.global.u32 %r7490, [%rd2492]; | |
and.b32 %r7491, %r7490, 65535; | |
bfe.u32 %r7492, %r7490, 16, 6; | |
mul.wide.u32 %rd2493, %r7491, 1792; | |
add.s64 %rd2494, %rd414, %rd2493; | |
mul.wide.u32 %rd2495, %r7492, 28; | |
add.s64 %rd2496, %rd2494, %rd2495; | |
ld.global.u32 %r7493, [%rd2496]; | |
and.b32 %r7494, %r7493, 65535; | |
shl.b32 %r7495, %r7494, 6; | |
bfe.u32 %r7496, %r7493, 16, 6; | |
or.b32 %r2341, %r7495, %r7496; | |
st.global.u32 [%rd153+120], %r2341; | |
bfe.u32 %r7497, %r7490, 22, 6; | |
mul.wide.u32 %rd2497, %r7497, 28; | |
add.s64 %rd2498, %rd2494, %rd2497; | |
ld.global.u32 %r7498, [%rd2498]; | |
and.b32 %r7499, %r7498, 65535; | |
shl.b32 %r7500, %r7499, 6; | |
bfe.u32 %r7501, %r7498, 16, 6; | |
or.b32 %r18138, %r7500, %r7501; | |
st.global.u32 [%rd153+124], %r18138; | |
setp.le.u32 %p301, %r2341, %r18138; | |
mov.u32 %r18137, %r2341; | |
@%p301 bra BB12_586; | |
st.global.u32 [%rd153+120], %r18138; | |
st.global.u32 [%rd153+124], %r2341; | |
mov.u32 %r17462, %r18138; | |
mov.u32 %r18138, %r2341; | |
mov.u32 %r18137, %r17462; | |
BB12_586: | |
mov.u32 %r2344, %r18137; | |
mov.u32 %r2343, %r18138; | |
setp.le.u32 %p302, %r18131, %r2344; | |
mov.u32 %r18133, %r2344; | |
mov.u32 %r18134, %r2343; | |
@%p302 bra BB12_588; | |
st.global.u32 [%rd153+112], %r2344; | |
st.global.u32 [%rd153+120], %r18131; | |
st.global.u32 [%rd153+116], %r2343; | |
st.global.u32 [%rd153+124], %r18132; | |
mov.u32 %r17459, %r18132; | |
mov.u32 %r17461, %r18131; | |
mov.u32 %r18132, %r2343; | |
mov.u32 %r18131, %r2344; | |
mov.u32 %r18133, %r17461; | |
mov.u32 %r18134, %r17459; | |
BB12_588: | |
mov.u32 %r2348, %r18131; | |
mov.u32 %r2347, %r18132; | |
mov.u32 %r2346, %r18133; | |
mov.u32 %r2345, %r18134; | |
setp.le.u32 %p303, %r18115, %r2348; | |
mov.u32 %r18119, %r2348; | |
mov.u32 %r18120, %r2347; | |
mov.u32 %r18121, %r2346; | |
mov.u32 %r18122, %r2345; | |
@%p303 bra BB12_590; | |
st.global.u32 [%rd153+96], %r2348; | |
st.global.u32 [%rd153+112], %r18115; | |
st.global.u32 [%rd153+100], %r2347; | |
st.global.u32 [%rd153+116], %r18116; | |
st.global.u32 [%rd153+104], %r2346; | |
st.global.u32 [%rd153+120], %r18117; | |
st.global.u32 [%rd153+108], %r2345; | |
st.global.u32 [%rd153+124], %r18118; | |
mov.u32 %r17449, %r18118; | |
mov.u32 %r17451, %r18117; | |
mov.u32 %r17453, %r18116; | |
mov.u32 %r17455, %r18115; | |
mov.u32 %r18118, %r2345; | |
mov.u32 %r18117, %r2346; | |
mov.u32 %r18116, %r2347; | |
mov.u32 %r18115, %r2348; | |
mov.u32 %r18119, %r17455; | |
mov.u32 %r18120, %r17453; | |
mov.u32 %r18121, %r17451; | |
mov.u32 %r18122, %r17449; | |
BB12_590: | |
mov.u32 %r2356, %r18115; | |
mov.u32 %r2355, %r18116; | |
mov.u32 %r2354, %r18117; | |
mov.u32 %r2353, %r18118; | |
mov.u32 %r2352, %r18119; | |
mov.u32 %r2351, %r18120; | |
mov.u32 %r2350, %r18121; | |
mov.u32 %r2349, %r18122; | |
setp.le.u32 %p304, %r18075, %r2356; | |
mov.u32 %r18083, %r2356; | |
mov.u32 %r18084, %r2355; | |
mov.u32 %r18085, %r2354; | |
mov.u32 %r18086, %r2353; | |
mov.u32 %r18087, %r2352; | |
mov.u32 %r18088, %r2351; | |
mov.u32 %r18089, %r2350; | |
mov.u32 %r18090, %r2349; | |
@%p304 bra BB12_592; | |
st.global.u32 [%rd153+64], %r2356; | |
st.global.u32 [%rd153+96], %r18075; | |
st.global.u32 [%rd153+68], %r2355; | |
st.global.u32 [%rd153+100], %r18076; | |
st.global.u32 [%rd153+72], %r2354; | |
st.global.u32 [%rd153+104], %r18077; | |
st.global.u32 [%rd153+76], %r2353; | |
st.global.u32 [%rd153+108], %r18078; | |
st.global.u32 [%rd153+80], %r2352; | |
st.global.u32 [%rd153+112], %r18079; | |
st.global.u32 [%rd153+84], %r2351; | |
st.global.u32 [%rd153+116], %r18080; | |
st.global.u32 [%rd153+88], %r2350; | |
st.global.u32 [%rd153+120], %r18081; | |
st.global.u32 [%rd153+92], %r2349; | |
st.global.u32 [%rd153+124], %r18082; | |
mov.u32 %r17421, %r18082; | |
mov.u32 %r17423, %r18081; | |
mov.u32 %r17425, %r18080; | |
mov.u32 %r17427, %r18079; | |
mov.u32 %r17429, %r18078; | |
mov.u32 %r17431, %r18077; | |
mov.u32 %r17433, %r18076; | |
mov.u32 %r17435, %r18075; | |
mov.u32 %r18082, %r2349; | |
mov.u32 %r18081, %r2350; | |
mov.u32 %r18080, %r2351; | |
mov.u32 %r18079, %r2352; | |
mov.u32 %r18078, %r2353; | |
mov.u32 %r18077, %r2354; | |
mov.u32 %r18076, %r2355; | |
mov.u32 %r18075, %r2356; | |
mov.u32 %r18083, %r17435; | |
mov.u32 %r18084, %r17433; | |
mov.u32 %r18085, %r17431; | |
mov.u32 %r18086, %r17429; | |
mov.u32 %r18087, %r17427; | |
mov.u32 %r18088, %r17425; | |
mov.u32 %r18089, %r17423; | |
mov.u32 %r18090, %r17421; | |
BB12_592: | |
mov.u32 %r2372, %r18075; | |
mov.u32 %r2371, %r18076; | |
mov.u32 %r2370, %r18077; | |
mov.u32 %r2369, %r18078; | |
mov.u32 %r2368, %r18079; | |
mov.u32 %r2367, %r18080; | |
mov.u32 %r2366, %r18081; | |
mov.u32 %r2365, %r18082; | |
mov.u32 %r2364, %r18083; | |
mov.u32 %r2363, %r18084; | |
mov.u32 %r2362, %r18085; | |
mov.u32 %r2361, %r18086; | |
mov.u32 %r2360, %r18087; | |
mov.u32 %r2359, %r18088; | |
mov.u32 %r2358, %r18089; | |
mov.u32 %r2357, %r18090; | |
setp.le.u32 %p305, %r17979, %r2372; | |
mov.u32 %r17995, %r2372; | |
mov.u32 %r17996, %r2371; | |
mov.u32 %r17997, %r2370; | |
mov.u32 %r17998, %r2369; | |
mov.u32 %r17999, %r2368; | |
mov.u32 %r18000, %r2367; | |
mov.u32 %r18001, %r2366; | |
mov.u32 %r18002, %r2365; | |
mov.u32 %r18003, %r2364; | |
mov.u32 %r18004, %r2363; | |
mov.u32 %r18005, %r2362; | |
mov.u32 %r18006, %r2361; | |
mov.u32 %r18007, %r2360; | |
mov.u32 %r18008, %r2359; | |
mov.u32 %r18009, %r2358; | |
mov.u32 %r18010, %r2357; | |
@%p305 bra BB12_594; | |
st.global.u32 [%rd153], %r2372; | |
st.global.u32 [%rd153+64], %r17979; | |
st.global.u32 [%rd153+4], %r2371; | |
st.global.u32 [%rd153+68], %r17980; | |
st.global.u32 [%rd153+8], %r2370; | |
st.global.u32 [%rd153+72], %r17981; | |
st.global.u32 [%rd153+12], %r2369; | |
st.global.u32 [%rd153+76], %r17982; | |
st.global.u32 [%rd153+16], %r2368; | |
st.global.u32 [%rd153+80], %r17983; | |
st.global.u32 [%rd153+20], %r2367; | |
st.global.u32 [%rd153+84], %r17984; | |
st.global.u32 [%rd153+24], %r2366; | |
st.global.u32 [%rd153+88], %r17985; | |
st.global.u32 [%rd153+28], %r2365; | |
st.global.u32 [%rd153+92], %r17986; | |
st.global.u32 [%rd153+32], %r2364; | |
st.global.u32 [%rd153+96], %r17987; | |
st.global.u32 [%rd153+36], %r2363; | |
st.global.u32 [%rd153+100], %r17988; | |
st.global.u32 [%rd153+40], %r2362; | |
st.global.u32 [%rd153+104], %r17989; | |
st.global.u32 [%rd153+44], %r2361; | |
st.global.u32 [%rd153+108], %r17990; | |
st.global.u32 [%rd153+48], %r2360; | |
st.global.u32 [%rd153+112], %r17991; | |
st.global.u32 [%rd153+52], %r2359; | |
st.global.u32 [%rd153+116], %r17992; | |
st.global.u32 [%rd153+56], %r2358; | |
st.global.u32 [%rd153+120], %r17993; | |
st.global.u32 [%rd153+60], %r2357; | |
st.global.u32 [%rd153+124], %r17994; | |
mov.u32 %r17349, %r17994; | |
mov.u32 %r17351, %r17993; | |
mov.u32 %r17353, %r17992; | |
mov.u32 %r17355, %r17991; | |
mov.u32 %r17357, %r17990; | |
mov.u32 %r17359, %r17989; | |
mov.u32 %r17361, %r17988; | |
mov.u32 %r17363, %r17987; | |
mov.u32 %r17365, %r17986; | |
mov.u32 %r17367, %r17985; | |
mov.u32 %r17369, %r17984; | |
mov.u32 %r17371, %r17983; | |
mov.u32 %r17373, %r17982; | |
mov.u32 %r17375, %r17981; | |
mov.u32 %r17377, %r17980; | |
mov.u32 %r17379, %r17979; | |
mov.u32 %r17994, %r2357; | |
mov.u32 %r17993, %r2358; | |
mov.u32 %r17992, %r2359; | |
mov.u32 %r17991, %r2360; | |
mov.u32 %r17990, %r2361; | |
mov.u32 %r17989, %r2362; | |
mov.u32 %r17988, %r2363; | |
mov.u32 %r17987, %r2364; | |
mov.u32 %r17986, %r2365; | |
mov.u32 %r17985, %r2366; | |
mov.u32 %r17984, %r2367; | |
mov.u32 %r17983, %r2368; | |
mov.u32 %r17982, %r2369; | |
mov.u32 %r17981, %r2370; | |
mov.u32 %r17980, %r2371; | |
mov.u32 %r17979, %r2372; | |
mov.u32 %r17995, %r17379; | |
mov.u32 %r17996, %r17377; | |
mov.u32 %r17997, %r17375; | |
mov.u32 %r17998, %r17373; | |
mov.u32 %r17999, %r17371; | |
mov.u32 %r18000, %r17369; | |
mov.u32 %r18001, %r17367; | |
mov.u32 %r18002, %r17365; | |
mov.u32 %r18003, %r17363; | |
mov.u32 %r18004, %r17361; | |
mov.u32 %r18005, %r17359; | |
mov.u32 %r18006, %r17357; | |
mov.u32 %r18007, %r17355; | |
mov.u32 %r18008, %r17353; | |
mov.u32 %r18009, %r17351; | |
mov.u32 %r18010, %r17349; | |
BB12_594: | |
mov.u32 %r2404, %r17979; | |
mul.lo.s64 %rd2499, %rd156, 1792; | |
add.s64 %rd2500, %rd6, %rd2499; | |
bfe.u32 %r7502, %r2197, 22, 6; | |
mul.wide.u32 %rd2501, %r7502, 28; | |
add.s64 %rd2502, %rd2500, %rd2501; | |
ld.global.u32 %r2405, [%rd2502+-4]; | |
and.b32 %r7503, %r2405, 65535; | |
mul.wide.u32 %rd2503, %r7503, 1792; | |
add.s64 %rd2504, %rd4, %rd2503; | |
bfe.u32 %r7504, %r2405, 16, 6; | |
mul.wide.u32 %rd2505, %r7504, 28; | |
add.s64 %rd2506, %rd2504, %rd2505; | |
ld.global.u32 %r2406, [%rd2506+-8]; | |
and.b32 %r7505, %r2406, 65535; | |
mul.wide.u32 %rd2507, %r7505, 1792; | |
add.s64 %rd2508, %rd6, %rd2507; | |
bfe.u32 %r7506, %r2406, 16, 6; | |
mul.wide.u32 %rd2509, %r7506, 28; | |
add.s64 %rd2510, %rd2508, %rd2509; | |
ld.global.u32 %r2407, [%rd2510+-8]; | |
and.b32 %r7507, %r2407, 65535; | |
mul.wide.u32 %rd2511, %r7507, 1792; | |
add.s64 %rd2512, %rd4, %rd2511; | |
cvt.u64.u32 %rd172, %r7503; | |
cvt.u64.u32 %rd173, %r7505; | |
cvt.u64.u32 %rd174, %r7507; | |
bfe.u32 %r7508, %r2407, 16, 6; | |
mul.wide.u32 %rd2513, %r7508, 28; | |
add.s64 %rd2514, %rd2512, %rd2513; | |
ld.global.u32 %r2408, [%rd2514+-12]; | |
and.b32 %r7509, %r2408, 65535; | |
cvt.u64.u32 %rd175, %r7509; | |
bfe.u32 %r7510, %r2408, 16, 6; | |
mul.wide.u32 %rd2515, %r7509, 1792; | |
add.s64 %rd2516, %rd415, %rd2515; | |
mul.wide.u32 %rd2517, %r7510, 28; | |
add.s64 %rd2518, %rd2516, %rd2517; | |
ld.global.u32 %r7511, [%rd2518]; | |
and.b32 %r7512, %r7511, 65535; | |
bfe.u32 %r7513, %r7511, 16, 6; | |
mul.wide.u32 %rd2519, %r7512, 1792; | |
add.s64 %rd2520, %rd414, %rd2519; | |
mul.wide.u32 %rd2521, %r7513, 28; | |
add.s64 %rd2522, %rd2520, %rd2521; | |
ld.global.u32 %r7514, [%rd2522]; | |
and.b32 %r7515, %r7514, 65535; | |
shl.b32 %r7516, %r7515, 6; | |
bfe.u32 %r7517, %r7514, 16, 6; | |
or.b32 %r2409, %r7516, %r7517; | |
st.global.u32 [%rd153+128], %r2409; | |
bfe.u32 %r7518, %r7511, 22, 6; | |
mul.wide.u32 %rd2523, %r7518, 28; | |
add.s64 %rd2524, %rd2520, %rd2523; | |
ld.global.u32 %r7519, [%rd2524]; | |
and.b32 %r7520, %r7519, 65535; | |
shl.b32 %r7521, %r7520, 6; | |
bfe.u32 %r7522, %r7519, 16, 6; | |
or.b32 %r17880, %r7521, %r7522; | |
st.global.u32 [%rd153+132], %r17880; | |
setp.le.u32 %p306, %r2409, %r17880; | |
mov.u32 %r17879, %r2409; | |
@%p306 bra BB12_596; | |
st.global.u32 [%rd153+128], %r17880; | |
st.global.u32 [%rd153+132], %r2409; | |
mov.u32 %r17525, %r17880; | |
mov.u32 %r17880, %r2409; | |
mov.u32 %r17879, %r17525; | |
BB12_596: | |
mov.u32 %r17875, %r17879; | |
mov.u32 %r17876, %r17880; | |
bfe.u32 %r7523, %r2408, 22, 6; | |
mul.lo.s64 %rd2525, %rd175, 1792; | |
add.s64 %rd2526, %rd415, %rd2525; | |
mul.wide.u32 %rd2527, %r7523, 28; | |
add.s64 %rd2528, %rd2526, %rd2527; | |
ld.global.u32 %r7524, [%rd2528]; | |
and.b32 %r7525, %r7524, 65535; | |
bfe.u32 %r7526, %r7524, 16, 6; | |
mul.wide.u32 %rd2529, %r7525, 1792; | |
add.s64 %rd2530, %rd414, %rd2529; | |
mul.wide.u32 %rd2531, %r7526, 28; | |
add.s64 %rd2532, %rd2530, %rd2531; | |
ld.global.u32 %r7527, [%rd2532]; | |
and.b32 %r7528, %r7527, 65535; | |
shl.b32 %r7529, %r7528, 6; | |
bfe.u32 %r7530, %r7527, 16, 6; | |
or.b32 %r2413, %r7529, %r7530; | |
st.global.u32 [%rd153+136], %r2413; | |
bfe.u32 %r7531, %r7524, 22, 6; | |
mul.wide.u32 %rd2533, %r7531, 28; | |
add.s64 %rd2534, %rd2530, %rd2533; | |
ld.global.u32 %r7532, [%rd2534]; | |
and.b32 %r7533, %r7532, 65535; | |
shl.b32 %r7534, %r7533, 6; | |
bfe.u32 %r7535, %r7532, 16, 6; | |
or.b32 %r17882, %r7534, %r7535; | |
st.global.u32 [%rd153+140], %r17882; | |
setp.le.u32 %p307, %r2413, %r17882; | |
mov.u32 %r17881, %r2413; | |
@%p307 bra BB12_598; | |
st.global.u32 [%rd153+136], %r17882; | |
st.global.u32 [%rd153+140], %r2413; | |
mov.u32 %r17531, %r17882; | |
mov.u32 %r17882, %r2413; | |
mov.u32 %r17881, %r17531; | |
BB12_598: | |
mov.u32 %r2416, %r17881; | |
mov.u32 %r2415, %r17882; | |
setp.le.u32 %p308, %r17875, %r2416; | |
mov.u32 %r17877, %r2416; | |
mov.u32 %r17878, %r2415; | |
@%p308 bra BB12_600; | |
st.global.u32 [%rd153+128], %r2416; | |
st.global.u32 [%rd153+136], %r17875; | |
st.global.u32 [%rd153+132], %r2415; | |
st.global.u32 [%rd153+140], %r17876; | |
mov.u32 %r17528, %r17876; | |
mov.u32 %r17530, %r17875; | |
mov.u32 %r17876, %r2415; | |
mov.u32 %r17875, %r2416; | |
mov.u32 %r17877, %r17530; | |
mov.u32 %r17878, %r17528; | |
BB12_600: | |
mov.u32 %r17867, %r17875; | |
mov.u32 %r17868, %r17876; | |
mov.u32 %r17869, %r17877; | |
mov.u32 %r17870, %r17878; | |
mul.lo.s64 %rd2535, %rd174, 1792; | |
add.s64 %rd2536, %rd4, %rd2535; | |
bfe.u32 %r7536, %r2407, 22, 6; | |
mul.wide.u32 %rd2537, %r7536, 28; | |
add.s64 %rd2538, %rd2536, %rd2537; | |
ld.global.u32 %r2421, [%rd2538+-12]; | |
and.b32 %r7537, %r2421, 65535; | |
cvt.u64.u32 %rd176, %r7537; | |
bfe.u32 %r7538, %r2421, 16, 6; | |
mul.wide.u32 %rd2539, %r7537, 1792; | |
add.s64 %rd2540, %rd415, %rd2539; | |
mul.wide.u32 %rd2541, %r7538, 28; | |
add.s64 %rd2542, %rd2540, %rd2541; | |
ld.global.u32 %r7539, [%rd2542]; | |
and.b32 %r7540, %r7539, 65535; | |
bfe.u32 %r7541, %r7539, 16, 6; | |
mul.wide.u32 %rd2543, %r7540, 1792; | |
add.s64 %rd2544, %rd414, %rd2543; | |
mul.wide.u32 %rd2545, %r7541, 28; | |
add.s64 %rd2546, %rd2544, %rd2545; | |
ld.global.u32 %r7542, [%rd2546]; | |
and.b32 %r7543, %r7542, 65535; | |
shl.b32 %r7544, %r7543, 6; | |
bfe.u32 %r7545, %r7542, 16, 6; | |
or.b32 %r2422, %r7544, %r7545; | |
st.global.u32 [%rd153+144], %r2422; | |
bfe.u32 %r7546, %r7539, 22, 6; | |
mul.wide.u32 %rd2547, %r7546, 28; | |
add.s64 %rd2548, %rd2544, %rd2547; | |
ld.global.u32 %r7547, [%rd2548]; | |
and.b32 %r7548, %r7547, 65535; | |
shl.b32 %r7549, %r7548, 6; | |
bfe.u32 %r7550, %r7547, 16, 6; | |
or.b32 %r17888, %r7549, %r7550; | |
st.global.u32 [%rd153+148], %r17888; | |
setp.le.u32 %p309, %r2422, %r17888; | |
mov.u32 %r17887, %r2422; | |
@%p309 bra BB12_602; | |
st.global.u32 [%rd153+144], %r17888; | |
st.global.u32 [%rd153+148], %r2422; | |
mov.u32 %r17545, %r17888; | |
mov.u32 %r17888, %r2422; | |
mov.u32 %r17887, %r17545; | |
BB12_602: | |
mov.u32 %r17883, %r17887; | |
mov.u32 %r17884, %r17888; | |
bfe.u32 %r7551, %r2421, 22, 6; | |
mul.lo.s64 %rd2549, %rd176, 1792; | |
add.s64 %rd2550, %rd415, %rd2549; | |
mul.wide.u32 %rd2551, %r7551, 28; | |
add.s64 %rd2552, %rd2550, %rd2551; | |
ld.global.u32 %r7552, [%rd2552]; | |
and.b32 %r7553, %r7552, 65535; | |
bfe.u32 %r7554, %r7552, 16, 6; | |
mul.wide.u32 %rd2553, %r7553, 1792; | |
add.s64 %rd2554, %rd414, %rd2553; | |
mul.wide.u32 %rd2555, %r7554, 28; | |
add.s64 %rd2556, %rd2554, %rd2555; | |
ld.global.u32 %r7555, [%rd2556]; | |
and.b32 %r7556, %r7555, 65535; | |
shl.b32 %r7557, %r7556, 6; | |
bfe.u32 %r7558, %r7555, 16, 6; | |
or.b32 %r2426, %r7557, %r7558; | |
st.global.u32 [%rd153+152], %r2426; | |
bfe.u32 %r7559, %r7552, 22, 6; | |
mul.wide.u32 %rd2557, %r7559, 28; | |
add.s64 %rd2558, %rd2554, %rd2557; | |
ld.global.u32 %r7560, [%rd2558]; | |
and.b32 %r7561, %r7560, 65535; | |
shl.b32 %r7562, %r7561, 6; | |
bfe.u32 %r7563, %r7560, 16, 6; | |
or.b32 %r17890, %r7562, %r7563; | |
st.global.u32 [%rd153+156], %r17890; | |
setp.le.u32 %p310, %r2426, %r17890; | |
mov.u32 %r17889, %r2426; | |
@%p310 bra BB12_604; | |
st.global.u32 [%rd153+152], %r17890; | |
st.global.u32 [%rd153+156], %r2426; | |
mov.u32 %r17551, %r17890; | |
mov.u32 %r17890, %r2426; | |
mov.u32 %r17889, %r17551; | |
BB12_604: | |
mov.u32 %r2429, %r17889; | |
mov.u32 %r2428, %r17890; | |
setp.le.u32 %p311, %r17883, %r2429; | |
mov.u32 %r17885, %r2429; | |
mov.u32 %r17886, %r2428; | |
@%p311 bra BB12_606; | |
st.global.u32 [%rd153+144], %r2429; | |
st.global.u32 [%rd153+152], %r17883; | |
st.global.u32 [%rd153+148], %r2428; | |
st.global.u32 [%rd153+156], %r17884; | |
mov.u32 %r17548, %r17884; | |
mov.u32 %r17550, %r17883; | |
mov.u32 %r17884, %r2428; | |
mov.u32 %r17883, %r2429; | |
mov.u32 %r17885, %r17550; | |
mov.u32 %r17886, %r17548; | |
BB12_606: | |
mov.u32 %r2433, %r17883; | |
mov.u32 %r2432, %r17884; | |
mov.u32 %r2431, %r17885; | |
mov.u32 %r2430, %r17886; | |
setp.le.u32 %p312, %r17867, %r2433; | |
mov.u32 %r17871, %r2433; | |
mov.u32 %r17872, %r2432; | |
mov.u32 %r17873, %r2431; | |
mov.u32 %r17874, %r2430; | |
@%p312 bra BB12_608; | |
st.global.u32 [%rd153+128], %r2433; | |
st.global.u32 [%rd153+144], %r17867; | |
st.global.u32 [%rd153+132], %r2432; | |
st.global.u32 [%rd153+148], %r17868; | |
st.global.u32 [%rd153+136], %r2431; | |
st.global.u32 [%rd153+152], %r17869; | |
st.global.u32 [%rd153+140], %r2430; | |
st.global.u32 [%rd153+156], %r17870; | |
mov.u32 %r17538, %r17870; | |
mov.u32 %r17540, %r17869; | |
mov.u32 %r17542, %r17868; | |
mov.u32 %r17544, %r17867; | |
mov.u32 %r17870, %r2430; | |
mov.u32 %r17869, %r2431; | |
mov.u32 %r17868, %r2432; | |
mov.u32 %r17867, %r2433; | |
mov.u32 %r17871, %r17544; | |
mov.u32 %r17872, %r17542; | |
mov.u32 %r17873, %r17540; | |
mov.u32 %r17874, %r17538; | |
BB12_608: | |
mov.u32 %r17851, %r17867; | |
mov.u32 %r17852, %r17868; | |
mov.u32 %r17853, %r17869; | |
mov.u32 %r17854, %r17870; | |
mov.u32 %r17855, %r17871; | |
mov.u32 %r17856, %r17872; | |
mov.u32 %r17857, %r17873; | |
mov.u32 %r17858, %r17874; | |
mul.lo.s64 %rd2559, %rd173, 1792; | |
add.s64 %rd2560, %rd6, %rd2559; | |
bfe.u32 %r7564, %r2406, 22, 6; | |
mul.wide.u32 %rd2561, %r7564, 28; | |
add.s64 %rd2562, %rd2560, %rd2561; | |
ld.global.u32 %r2442, [%rd2562+-8]; | |
and.b32 %r7565, %r2442, 65535; | |
mul.wide.u32 %rd2563, %r7565, 1792; | |
add.s64 %rd2564, %rd4, %rd2563; | |
cvt.u64.u32 %rd177, %r7565; | |
bfe.u32 %r7566, %r2442, 16, 6; | |
mul.wide.u32 %rd2565, %r7566, 28; | |
add.s64 %rd2566, %rd2564, %rd2565; | |
ld.global.u32 %r2443, [%rd2566+-12]; | |
and.b32 %r7567, %r2443, 65535; | |
cvt.u64.u32 %rd178, %r7567; | |
bfe.u32 %r7568, %r2443, 16, 6; | |
mul.wide.u32 %rd2567, %r7567, 1792; | |
add.s64 %rd2568, %rd415, %rd2567; | |
mul.wide.u32 %rd2569, %r7568, 28; | |
add.s64 %rd2570, %rd2568, %rd2569; | |
ld.global.u32 %r7569, [%rd2570]; | |
and.b32 %r7570, %r7569, 65535; | |
bfe.u32 %r7571, %r7569, 16, 6; | |
mul.wide.u32 %rd2571, %r7570, 1792; | |
add.s64 %rd2572, %rd414, %rd2571; | |
mul.wide.u32 %rd2573, %r7571, 28; | |
add.s64 %rd2574, %rd2572, %rd2573; | |
ld.global.u32 %r7572, [%rd2574]; | |
and.b32 %r7573, %r7572, 65535; | |
shl.b32 %r7574, %r7573, 6; | |
bfe.u32 %r7575, %r7572, 16, 6; | |
or.b32 %r2444, %r7574, %r7575; | |
st.global.u32 [%rd153+160], %r2444; | |
bfe.u32 %r7576, %r7569, 22, 6; | |
mul.wide.u32 %rd2575, %r7576, 28; | |
add.s64 %rd2576, %rd2572, %rd2575; | |
ld.global.u32 %r7577, [%rd2576]; | |
and.b32 %r7578, %r7577, 65535; | |
shl.b32 %r7579, %r7578, 6; | |
bfe.u32 %r7580, %r7577, 16, 6; | |
or.b32 %r17904, %r7579, %r7580; | |
st.global.u32 [%rd153+164], %r17904; | |
setp.le.u32 %p313, %r2444, %r17904; | |
mov.u32 %r17903, %r2444; | |
@%p313 bra BB12_610; | |
st.global.u32 [%rd153+160], %r17904; | |
st.global.u32 [%rd153+164], %r2444; | |
mov.u32 %r17581, %r17904; | |
mov.u32 %r17904, %r2444; | |
mov.u32 %r17903, %r17581; | |
BB12_610: | |
mov.u32 %r17899, %r17903; | |
mov.u32 %r17900, %r17904; | |
bfe.u32 %r7581, %r2443, 22, 6; | |
mul.lo.s64 %rd2577, %rd178, 1792; | |
add.s64 %rd2578, %rd415, %rd2577; | |
mul.wide.u32 %rd2579, %r7581, 28; | |
add.s64 %rd2580, %rd2578, %rd2579; | |
ld.global.u32 %r7582, [%rd2580]; | |
and.b32 %r7583, %r7582, 65535; | |
bfe.u32 %r7584, %r7582, 16, 6; | |
mul.wide.u32 %rd2581, %r7583, 1792; | |
add.s64 %rd2582, %rd414, %rd2581; | |
mul.wide.u32 %rd2583, %r7584, 28; | |
add.s64 %rd2584, %rd2582, %rd2583; | |
ld.global.u32 %r7585, [%rd2584]; | |
and.b32 %r7586, %r7585, 65535; | |
shl.b32 %r7587, %r7586, 6; | |
bfe.u32 %r7588, %r7585, 16, 6; | |
or.b32 %r2448, %r7587, %r7588; | |
st.global.u32 [%rd153+168], %r2448; | |
bfe.u32 %r7589, %r7582, 22, 6; | |
mul.wide.u32 %rd2585, %r7589, 28; | |
add.s64 %rd2586, %rd2582, %rd2585; | |
ld.global.u32 %r7590, [%rd2586]; | |
and.b32 %r7591, %r7590, 65535; | |
shl.b32 %r7592, %r7591, 6; | |
bfe.u32 %r7593, %r7590, 16, 6; | |
or.b32 %r17906, %r7592, %r7593; | |
st.global.u32 [%rd153+172], %r17906; | |
setp.le.u32 %p314, %r2448, %r17906; | |
mov.u32 %r17905, %r2448; | |
@%p314 bra BB12_612; | |
st.global.u32 [%rd153+168], %r17906; | |
st.glo |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment