80 lines
7.3 KiB
ArmAsm
80 lines
7.3 KiB
ArmAsm
|
|
code for sm_35
|
|
Function : _Z19mandelbrot_scanlineffffiiiiiPi
/*
 * SASS disassembly of the kernel whose mangled name demangles to
 *   mandelbrot_scanline(float, float, float, float, int, int, int, int, int, int*)
 *
 * Parameter names are not visible in this listing, so the notes below refer
 * to parameters by constant-bank offset. Assuming the arguments are laid out
 * in declaration order starting at c[0x0][0x140] (consistent with the offsets
 * that are read here -- TODO confirm against the kernel source):
 *   0x140, 0x144, 0x148, 0x14c : float arguments 1..4
 *   0x150, 0x154, 0x158, 0x15c, 0x160 : int arguments 5..9
 *   0x168 / 0x16c : low / high 32 bits of the int* argument
 *
 * Overall shape, as established by the instructions below:
 *   for (R2 = ctaid.y * c[0x15c]; R2 < min(R2start + c[0x15c], c[0x154]); R2++)
 *     for (R3 = ctaid.x * c[0x158]; R3 < min(R3start + c[0x158], c[0x150]); R3 += 32)
 *       col = R3 + (tid.x & 31)
 *       iterate z = z*z + c up to c[0x160] times or until |z|^2 > 4
 *       if (col < column bound, unsigned) out[R2 * c[0x150] + col] = iteration count
 *
 * Register roles:
 *   R2  outer (row) counter          R11 outer bound
 *   R3  column base of inner loop    R0  inner (column) bound
 *   R4  row-derived float            R5  column-derived float
 *   R6  iteration count              R7 / R8 iterated pair
 *   R10 tid.x & 0x1f                 R12 R3 + R10
 *
 * Lines that hold only a hex word inside a comment (for example
 * 0x0880a010a0a01000) carry no instruction; presumably they are the
 * scheduling control words emitted for this architecture -- confirm against
 * the disassembler documentation.
 */
|
|
.headerflags @"EF_CUDA_SM35 EF_CUDA_PTX_SM(EF_CUDA_SM35)"
|
|
/* 0x0880a010a0a01000 */
|
|
/* R1 is loaded here and not referenced again in this listing (conventionally the local stack pointer -- assumption). */
/*0008*/ MOV R1, c[0x0][0x44]; /* 0x64c03c00089c0006 */
|
|
/*0010*/ S2R R0, SR_CTAID.Y; /* 0x86400000131c0002 */
|
|
/*0018*/ MOV R4, c[0x0][0x158]; /* 0x64c03c002b1c0012 */
|
|
/* R2 = ctaid.y * c[0x15c]: first value of the outer counter for this block. */
/*0020*/ IMUL R2, R0, c[0x0][0x15c]; /* 0x61c018002b9c000a */
|
|
/* R0 = R2 + c[0x15c]: one past the last outer value before clamping. */
/*0028*/ IADD R0, R2, c[0x0][0x15c]; /* 0x608000002b9c0802 */
|
|
/*0030*/ S2R R9, SR_CTAID.X; /* 0x86400000129c0026 */
|
|
/* R11 = min(R0, c[0x154]): clamped outer bound (IMNMX with PT selects the minimum). */
/*0038*/ IMNMX R11, R0, c[0x0][0x154], PT; /* 0x61081c002a9c002e */
|
|
/* 0x08b0a0100010b09c */
|
|
/* R0 = ctaid.x * c[0x158] + c[0x158]: one past the last column before clamping. */
/*0048*/ IMAD R0, R9, c[0x0][0x158], R4; /* 0x510810002b1c2402 */
|
|
/* P0 = (R2 >= R11): nothing to do for this block in the outer dimension. */
/*0050*/ ISETP.GE.AND P0, PT, R2, R11, PT; /* 0xdb681c00059c081e */
|
|
/* R0 = min(R0, c[0x150]): clamped column bound, kept in R0 for the rest of the kernel. */
/*0058*/ IMNMX R0, R0, c[0x0][0x150], PT; /* 0x61081c002a1c0002 */
|
|
/*0060*/ @P0 EXIT ; /* 0x180000000000003c */
|
|
/* ---- 0x68: head of the outer loop (branched back to from 0x208) ---- */
/* R3 = ctaid.x * c[0x158]: column base is reset for every outer iteration. */
/*0068*/ IMUL R3, R9, c[0x0][0x158]; /* 0x61c018002b1c240e */
|
|
/* Registers 0x1f8 as the reconvergence point used by the .S instruction at 0x1f0. */
/*0070*/ SSY 0x1f8; /* 0x14800000c0000000 */
|
|
/* P0 = (R3 >= R0): column range is empty, skip straight to the outer increment. */
/*0078*/ ISETP.GE.AND P0, PT, R3, R0, PT; /* 0xdb681c00001c0c1e */
|
|
/* 0x08a0100010a01000 */
|
|
/*0088*/ @P0 BRA 0x1f0; /* 0x12000000b000003c */
|
|
/* R4 = float(R2) * c[0x14c] + c[0x148]: row-derived constant term (signed conversion). */
/*0090*/ I2F.F32.S32 R4, R2; /* 0xe5c00000011ca812 */
|
|
/*0098*/ MOV R5, c[0x0][0x148]; /* 0x64c03c00291c0016 */
|
|
/* R16 = c[0x140], the addend of the column-derived term computed at 0xe8. */
/*00a0*/ MOV R16, c[0x0][0x140]; /* 0x64c03c00281c0042 */
|
|
/*00a8*/ FFMA R4, R4, c[0x0][0x14c], R5; /* 0x4c001400299c1012 */
|
|
/* ---- 0xb0: head of the column loop (branched back to from 0x1e8) ---- */
/*00b0*/ S2R R5, SR_TID.X; /* 0x86400000109c0016 */
|
|
/* R6 = 0: iteration counter for this point. */
/*00b8*/ MOV R6, RZ; /* 0xe4c03c007f9c001a */
|
|
/* 0x08800010a0a0a010 */
|
|
/* R10 = tid.x & 0x1f: only the low five bits of the thread index select the column offset. */
/*00c8*/ LOP.AND R10, R5, 0x1f; /* 0xc20000000f9c1429 */
|
|
/* P0 = (0 < c[0x160]): at least one iteration is allowed. */
/*00d0*/ ISETP.LT.AND P0, PT, RZ, c[0x0][0x160], PT; /* 0x5b181c002c1ffc1e */
|
|
/* R12 = R3 + R10: column handled by this thread in this pass. */
/*00d8*/ IADD R12, R10, R3; /* 0xe0800000019c2832 */
|
|
/* Column is converted as an unsigned value (the row used a signed conversion at 0x90). */
/*00e0*/ I2F.F32.U32 R5, R12; /* 0xe5c00000061c2816 */
|
|
/* R5 = float(R12) * c[0x144] + c[0x140]: column-derived constant term. */
/*00e8*/ FFMA R5, R5, c[0x0][0x144], R16; /* 0x4c004000289c1416 */
|
|
/* With c[0x160] <= 0 the iteration loop is skipped and R6 stays 0. */
/*00f0*/ @!P0 BRA 0x190; /* 0x120000004c20003c */
|
|
/* Initial z: R7 = R4 (row term), R8 = R5 (column term). */
/*00f8*/ MOV R7, R4; /* 0xe4c03c00021c001e */
|
|
/* 0x0800b0a0a0100010 */
|
|
/*0108*/ MOV R8, R5; /* 0xe4c03c00029c0022 */
|
|
/* Registers 0x190 as the target of the BRK instructions inside the loop. */
/*0110*/ PBK 0x190; /* 0x150000003c000000 */
|
|
/* ---- 0x118: iteration loop body ---- */
/* R13 = R7^2, R14 = R8^2, R15 = R8^2 + R7^2 (squared magnitude of z). */
/*0118*/ FMUL R13, R7, R7; /* 0xe3400000039c1c36 */
|
|
/*0120*/ FMUL R14, R8, R8; /* 0xe3400000041c203a */
|
|
/*0128*/ FADD R15, R14, R13; /* 0xe2c00000069c383e */
|
|
/* Leave the loop once the squared magnitude exceeds 4; R6 is not incremented for this pass. */
/*0130*/ FSETP.GT.AND P0, PT, R15, 4, PT; /* 0xb5a01e04001c3c1d */
|
|
/*0138*/ @P0 BRK ; /* 0x1a0000000000003c */
|
|
/* 0x080010ac809c8010 */
|
|
/*0148*/ IADD R6, R6, 0x1; /* 0xc0800000009c1819 */
|
|
/* R8 = 2 * R8 (old value), consumed by the FFMA at 0x168. */
/*0150*/ FADD R8, R8, R8; /* 0xe2c00000041c2022 */
|
|
/* R14 = R8_old^2 - R7_old^2. */
/*0158*/ FADD R14, R14, -R13; /* 0xe2c10000069c383a */
|
|
/* P0 = (R6 < c[0x160]): iteration budget not yet exhausted. */
/*0160*/ ISETP.LT.AND P0, PT, R6, c[0x0][0x160], PT; /* 0x5b181c002c1c181e */
|
|
/* R7 = 2 * R8_old * R7_old + R4: new second component (imaginary part of z*z + c). */
/*0168*/ FFMA R7, R8, R7, R4; /* 0xcc001000039c201e */
|
|
/* R8 = R5 + (R8_old^2 - R7_old^2): new first component (real part of z*z + c). */
/*0170*/ FADD R8, R5, R14; /* 0xe2c00000071c1422 */
|
|
/*0178*/ @!P0 BRK ; /* 0x1a0000000020003c */
|
|
/* 0x08b0a00010ac80b8 */
|
|
/*0188*/ BRA 0x118; /* 0x12007fffc41c003c */
|
|
/* ---- 0x190: loop exit / store of the iteration count ---- */
/* P0 = (R12 >= R0) as unsigned: this thread's column lies outside the clamped range. */
/*0190*/ ISETP.GE.U32.AND P0, PT, R12, R0, PT; /* 0xdb601c00001c301e */
|
|
/* R5 = R2 * c[0x150] + R3, then + R10: linear element index (row * c[0x150] + column). */
/*0198*/ IMAD R5, R2, c[0x0][0x150], R3; /* 0x51080c002a1c0816 */
|
|
/*01a0*/ IADD R5, R5, R10; /* 0xe0800000051c1416 */
|
|
/* Out-of-range threads skip the store; the instructions below are additionally predicated on !P0. */
/*01a8*/ @P0 BRA.U 0x1d8; /* 0x120000001400023c */
|
|
/* R8 = 4: element size in bytes used to scale the index. */
/*01b0*/ @!P0 MOV32I R8, 0x4; /* 0x740000000223c022 */
|
|
/* R12 = low word of (R5 * 4 + c[0x168]); .CC records the carry for the high word. */
/*01b8*/ @!P0 IMAD R12.CC, R5, R8, c[0x0][0x168]; /* 0x910c20002d201432 */
|
|
/* 0x08b000b8b0a000a0 */
|
|
/* R13 = high word of R5 * 4 + c[0x16c] + carry, completing the 64-bit address in R12:R13. */
/*01c8*/ @!P0 IMAD.HI.X R13, R5, R8, c[0x0][0x16c]; /* 0x931820002da01436 */
|
|
/* Store the iteration count R6 at the computed address. */
/*01d0*/ @!P0 ST.E [R12], R6; /* 0xe480000000203018 */
|
|
/* Advance the column base by 0x20 (matches the 5-bit lane mask at 0xc8) and loop while R3 < R0. */
/*01d8*/ IADD R3, R3, 0x20; /* 0xc0800000101c0c0d */
|
|
/*01e0*/ ISETP.LT.AND P0, PT, R3, R0, PT; /* 0xdb181c00001c0c1e */
|
|
/*01e8*/ @P0 BRA 0xb0; /* 0x12007fff6000003c */
|
|
/* ---- 0x1f0: outer-loop increment; .S pairs with the SSY at 0x70 ---- */
/*01f0*/ IADD.S R2, R2, 0x1; /* 0xc080000000dc0809 */
|
|
/* P0 = (R2 < R11): more outer iterations remain. */
/*01f8*/ ISETP.LT.AND P0, PT, R2, R11, PT; /* 0xdb181c00059c081e */
|
|
/* 0x0800000000b810b8 */
|
|
/*0208*/ @P0 BRA 0x68; /* 0x12007fff2c00003c */
|
|
/* Writes RZ to RZ; no register state changes. */
/*0210*/ MOV RZ, RZ; /* 0xe4c03c007f9c03fe */
|
|
/*0218*/ EXIT ; /* 0x18000000001c003c */
|
|
/* Self-branch and NOPs placed after the final EXIT; no branch in this listing targets them (presumably padding). */
/*0220*/ BRA 0x220; /* 0x12007ffffc1c003c */
|
|
/*0228*/ NOP; /* 0x85800000001c3c02 */
|
|
/*0230*/ NOP; /* 0x85800000001c3c02 */
|
|
/*0238*/ NOP; /* 0x85800000001c3c02 */
|
|
...................................................
|
|
|
|
|