[text] SASS code using cuobjdump

Viewer

copy | download | embed | print | Name: SASS code using cuobjdump
  /*
   * Kernel body, SM60 SASS as printed by cuobjdump (the function header line
   * is not part of this listing).
   *
   * Visible data flow:
   *   1. Sample the clock: R0 = SR_CLOCKLO, bracketed by two SR_CLOCKHI reads.
   *   2. Load one 32-bit word through the 64-bit address held in
   *      c[0x0][0x140] / c[0x0][0x144].
   *   3. Sample the clock again: R2 = SR_CLOCKLO.
   *   4. Convert the loaded word from unsigned int to float and compute its
   *      reciprocal into R7 (inline MUFU.RCP path, or CAL 0x200 otherwise).
   *   5. Store R7 through the address in c[0x0][0x148] / c[0x0][0x14c] and
   *      R6 = R2 - R0 through the address in c[0x0][0x150] / c[0x0][0x154].
   *
   * NOTE(review): c[0x0][0x140] onward are presumably the kernel parameters
   * (one input pointer, two output pointers) - confirm against the CUDA source.
   * NOTE(review): lines that carry only a hex word and no address are presumably
   * the per-bundle scheduling control words, or the encoding of the second
   * instruction of a braced pair - confirm against the cuobjdump documentation.
   */
  1.   .headerflags    @"EF_CUDA_SM60 EF_CUDA_PTX_SM(EF_CUDA_SM60)"
  2.                                                                                      /* 0x001fc400fec007f6 */
        /* R1 is loaded from c[0x0][0x20] and never read in this listing
           (presumably the ABI stack pointer setup - TODO confirm). */
  3.         /*0008*/                   MOV R1, c[0x0][0x20] ;                            /* 0x4c98078000870001 */
        /* R2 = 0, retry counter for the first clock sample. */
  4.         /*0010*/                   MOV R2, RZ ;                                      /* 0x5c9807800ff70002 */
        /* First clock sample (loop head, address 0x18).
           Each kept read is preceded by a read of the same register into RZ,
           whose result is discarded.
           R3 = SR_CLOCKHI, R0 = SR_CLOCKLO, R4 = SR_CLOCKHI again. */
  5.         /*0018*/                   CS2R RZ, SR_CLOCKHI ;                             /* 0x50c80000051700ff */
  6.                                                                                      /* 0x001f9800fe2007e6 */
  7.         /*0028*/                   CS2R R3, SR_CLOCKHI ;                             /* 0x50c8000005170003 */
  8.         /*0030*/                   CS2R RZ, SR_CLOCKLO ;                             /* 0x50c80000050700ff */
  9.         /*0038*/                   CS2R R0, SR_CLOCKLO ;                             /* 0x50c8000005070000 */
  10.                                                                                      /* 0x001fb400fcc007f1 */
  11.         /*0048*/                   CS2R RZ, SR_CLOCKHI ;                             /* 0x50c80000051700ff */
  12.         /*0050*/                   CS2R R4, SR_CLOCKHI ;                             /* 0x50c8000005170004 */
        /* P0 = the two high-word reads differ, i.e. the high word changed
           while the low word was being read. */
  13.         /*0058*/                   ISETP.NE.U32.AND P0, PT, R3, R4, PT ;             /* 0x5b6a038000470307 */
  14.                                                                                      /* 0x001fb400fec007fd */
        /* High word stable: accept R0 and leave the loop. */
  15.         /*0068*/              @!P0 BRA 0x90 ;                                        /* 0xe24000000208000f */
        /* Otherwise count the retry and loop back to 0x18 while the counter is
           below c[0x0][0x10c] (retry limit - its value is not visible here). */
  16.         /*0070*/                   IADD32I R2, R2, 0x1 ;                             /* 0x1c00000000170202 */
  17.         /*0078*/                   ISETP.GE.U32.AND P0, PT, R2, c[0x0][0x10c], PT ;  /* 0x4b6c038004370207 */
  18.                                                                                      /* 0x001fc800fe2007fd */
  19.         /*0088*/              @!P0 BRA 0x18 ;                                        /* 0xe2400ffff888000f */
        /* R2:R3 = 64-bit load address taken from c[0x0][0x140] / c[0x0][0x144]. */
  20.         /*0090*/                   MOV R2, c[0x0][0x140] ;                           /* 0x4c98078005070002 */
  21.         /*0098*/                   MOV R3, c[0x0][0x144] ;                           /* 0x4c98078005170003 */
  22.                                                                                      /* 0x001fc401fec000bd */
        /* Global load of one word into R3 (this overwrites the address high half).
           NOTE(review): the .CV modifier presumably selects the volatile cache
           policy - confirm. */
  23.         /*00a8*/                   LDG.E.CV R3, [R2] ;                               /* 0xeed4e00000070203 */
        /* R4 = 0, retry counter for the second clock sample. */
  24.         /*00b0*/                   MOV R4, RZ ;                                      /* 0x5c9807800ff70004 */
        /* Second clock sample (loop head, address 0xb8), same shape as the first:
           R5 = SR_CLOCKHI, R2 = SR_CLOCKLO, R6 = SR_CLOCKHI again. */
  25.         /*00b8*/                   CS2R RZ, SR_CLOCKHI ;                             /* 0x50c80000051700ff */
  26.                                                                                      /* 0x001f9800fe2007e6 */
  27.         /*00c8*/                   CS2R R5, SR_CLOCKHI ;                             /* 0x50c8000005170005 */
  28.         /*00d0*/                   CS2R RZ, SR_CLOCKLO ;                             /* 0x50c80000050700ff */
  29.         /*00d8*/                   CS2R R2, SR_CLOCKLO ;                             /* 0x50c8000005070002 */
  30.                                                                                      /* 0x001fb400fcc007f1 */
  31.         /*00e8*/                   CS2R RZ, SR_CLOCKHI ;                             /* 0x50c80000051700ff */
  32.         /*00f0*/                   CS2R R6, SR_CLOCKHI ;                             /* 0x50c8000005170006 */
  33.         /*00f8*/                   ISETP.NE.U32.AND P0, PT, R5, R6, PT ;             /* 0x5b6a038000670507 */
  34.                                                                                      /* 0x001fb400fec007fd */
        /* High word stable: accept R2. Otherwise retry from 0xb8 while the
           counter R4 is below c[0x0][0x10c]. */
  35.         /*0108*/              @!P0 BRA 0x130 ;                                       /* 0xe24000000208000f */
  36.         /*0110*/                   IADD32I R4, R4, 0x1 ;                             /* 0x1c00000000170404 */
  37.         /*0118*/                   ISETP.GE.U32.AND P0, PT, R4, c[0x0][0x10c], PT ;  /* 0x4b6c038004370407 */
  38.                                                                                      /* 0x003f9820e3a007fd */
  39.         /*0128*/              @!P0 BRA 0xb8 ;                                        /* 0xe2400ffff888000f */
        /* R3 = (float) of the loaded word, treated as unsigned 32-bit. */
  40.         /*0130*/                   I2F.F32.U32 R3, R3 ;                              /* 0x5cb8000000370a03 */
        /* Exponent range test selecting the reciprocal path:
           add 0x1800000 (3 in the exponent field, which starts at bit 23),
           keep only the exponent field, and compare unsigned against
           c[0x2][0x0] (threshold value not visible in this listing). */
  41.         /*0138*/                   IADD32I R4, R3, 0x1800000 ;                       /* 0x1c00180000070304 */
  42.                                                                                      /* 0x001ff400fda007f6 */
  43.         /*0148*/                   LOP32I.AND R4, R4, 0x7f800000 ;                   /* 0x0407f80000070404 */
  44.         /*0150*/                   ISETP.GT.U32.AND P0, PT, R4, c[0x2][0x0], PT ;    /* 0x4b68038800070407 */
        /* Above the threshold: take the inline path that starts at 0x180. */
  45.         /*0158*/               @P0 BRA 0x180 ;                                       /* 0xe24000000200000f */
  46.                                                                                      /* 0x001ff400fe0007fd */
        /* Otherwise call the subroutine at 0x200 (input R3, result in R4),
           copy its result to R7 and skip the inline path. */
  47.         /*0168*/                   CAL 0x200 ;                                       /* 0xe260000009000040 */
  48.         /*0170*/         {         MOV R7, R4 ;                                      /* 0x5c98078000470007 */
  49.         /*0178*/                   BRA 0x1b0         }
  50.                                                                                      /* 0xe24000000307000f */
  51.                                                                                      /* 0x001fd801fec0071d */
        /* Inline path (branch target 0x180 is the bundle holding 0x188):
             R4 = MUFU.RCP(R3)              hardware reciprocal estimate
             R5 = R3 * R4 + c[0x2][0x4]     (constant presumably -1.0f - TODO confirm)
             R5 = -R5
             R7 = R4 * R5 + R4              one correction step applied to the estimate */
  52.         /*0188*/                   MUFU.RCP R4, R3 ;                                 /* 0x5080000000470304 */
  53.         /*0190*/                   FFMA R5, R3, R4, c[0x2][0x4] ;                    /* 0x5180020800170305 */
  54.         /*0198*/                   FADD.FTZ R5, -R5, -RZ ;                           /* 0x5c5930000ff70505 */
  55.                                                                                      /* 0x001fc400fe2007f6 */
  56.         /*01a8*/                   FFMA R7, R4, R5, R4 ;                             /* 0x5980020000570407 */
        /* Join point 0x1b0: R6 = R2 - R0, second low-word sample minus the first. */
  57.         /*01b0*/                   IADD R6, -R0, R2 ;                                /* 0x5c12000000270006 */
        /* R2:R3 = address from c[0x0][0x148] / c[0x0][0x14c], receives R7.
           R4:R5 = address from c[0x0][0x150] / c[0x0][0x154], receives R6. */
  58.         /*01b8*/                   MOV R2, c[0x0][0x148] ;                           /* 0x4c98078005270002 */
  59.                                                                                      /* 0x001fc400fe0007f2 */
  60.         /*01c8*/                   MOV R3, c[0x0][0x14c] ;                           /* 0x4c98078005370003 */
  61.         /*01d0*/         {         MOV R4, c[0x0][0x150] ;                           /* 0x4c98078005470004 */
  62.         /*01d8*/                   STG.E [R2], R7         }
  63.                                                                                      /* 0xeedc200000070207 */
  64.                                                                                      /* 0x001ffc00fe2007f2 */
  65.         /*01e8*/                   MOV R5, c[0x0][0x154] ;                           /* 0x4c98078005570005 */
  66.         /*01f0*/                   STG.E [R4], R6 ;                                  /* 0xeedc200000070406 */
  67.         /*01f8*/                   EXIT ;                                            /* 0xe30000000007000f */
  /*
   * Subroutine at 0x200, reached through the CAL 0x200 at address 0x168.
   * In:     R3 = float bit pattern x.
   * Out:    R4 = reciprocal result (the caller copies R4 to R7).
   * Writes: R3 (denormal path only), R4-R11, P0-P2.
   *
   * Dispatch on the biased exponent field e (bits 30..23 of R3):
   *   e == 0 and all other non-sign bits zero : MUFU.RCP only
   *   e == 0 otherwise                        : scale input by 2^64, estimate plus
   *                                             one correction step, scale result by 2^64
   *   e == 253 or e == 254                    : result mantissa is built with integer
   *                                             shifts and an explicit rounding decision
   *   any other e                             : MUFU.RCP only
   */
  68.                                                                                      /* 0x001fb400fec007f6 */
        /* R4 = e: shift left by 1 drops the sign bit, logical shift right by 24
           leaves the 8 exponent bits. */
  69.         /*0208*/                   SHL R4, R3, 0x1 ;                                 /* 0x3848000000170304 */
  70.         /*0210*/                   SHR.U32 R4, R4, 0x18 ;                            /* 0x3828000001870404 */
  71.         /*0218*/                   ISETP.NE.U32.AND P0, PT, R4, RZ, PT ;             /* 0x5b6a03800ff70407 */
  72.                                                                                      /* 0x001fb400fec007fd */
        /* e != 0: continue at 0x2a0. */
  73.         /*0228*/               @P0 BRA 0x2a0 ;                                       /* 0xe24000000700000f */
        /* e == 0: P0 = any bit other than the sign is set.
           If none is set, return MUFU.RCP of the input directly. */
  74.         /*0230*/                   SHL R4, R3, 0x1 ;                                 /* 0x3848000000170304 */
  75.         /*0238*/                   ISETP.NE.AND P0, PT, R4, RZ, PT ;                 /* 0x5b6b03800ff70407 */
  76.                                                                                      /* 0x001fc801ffa00712 */
  77.         /*0248*/              @!P0 MUFU.RCP R4, R3 ;                                 /* 0x5080000000480304 */
  78.         /*0250*/              @!P0 RET ;                                             /* 0xe32000000008000f */
        /* e == 0 with nonzero mantissa: multiply the input by 2^64
           (1.8446744073709551616e+19) before estimating. */
  79.         /*0258*/                   FFMA R3, R3, 1.84467440737095516160e+19, RZ ;     /* 0x32807fdf80070303 */
  80.                                                                                      /* 0x001fd801fec0071d */
        /* Same estimate-and-correct sequence as the inline path at 0x188:
             R4 = MUFU.RCP(R3)
             R5 = -(R3 * R4 + c[0x2][0x4])   (constant presumably -1.0f - TODO confirm)
             R4 = R4 * R5 + R4 */
  81.         /*0268*/                   MUFU.RCP R4, R3 ;                                 /* 0x5080000000470304 */
  82.         /*0270*/                   FFMA R5, R3, R4, c[0x2][0x4] ;                    /* 0x5180020800170305 */
  83.         /*0278*/                   FADD.FTZ R5, -R5, -RZ ;                           /* 0x5c5930000ff70505 */
  84.                                                                                      /* 0x001ffc00fe0007f6 */
  85.         /*0288*/                   FFMA R4, R4, R5, R4 ;                             /* 0x5980020000570404 */
        /* Multiply the result by 2^64 as well (the reciprocal of the scaled input
           is too small by that factor), then return. */
  86.         /*0290*/         {         FFMA R4, R4, 1.84467440737095516160e+19, RZ ;     /* 0x32807fdf80070404 */
  87.         /*0298*/                   RET         }
  88.                                                                                      /* 0xe32000000007000f */
  89.                                                                                      /* 0x001ff400fda007f6 */
        /* Target 0x2a0 (e != 0). R5 = e - 253. The unsigned test "R5 greater than 1"
           sends every e other than 253 and 254 to the plain MUFU.RCP at 0x3e0. */
  90.         /*02a8*/                   IADD32I R5, R4, -0xfd ;                           /* 0x1c0ffffff0370405 */
  91.         /*02b0*/                   ISETP.GT.U32.AND P0, PT, R5, 0x1, PT ;            /* 0x3668038000170507 */
  92.         /*02b8*/               @P0 BRA 0x3e0 ;                                       /* 0xe24000001200000f */
  93.                                                                                      /* 0x001fd000fe2007f1 */
        /* e is 253 or 254 from here on, so R5 is 0 or 1.
             R11 = mantissa field of x (low 23 bits)
             R10 = 3, shifted left by R5 below: a two-bit mask at bit position R5
             R4  = e - 252 (1 or 2): final right-shift amount
             R6  = mantissa field with the exponent bits of 1.0f (0x3f800000) */
  94.         /*02c8*/                   LOP32I.AND R11, R3, 0x7fffff ;                    /* 0x040007fffff7030b */
  95.         /*02d0*/                   MOV32I R10, 0x3 ;                                 /* 0x010000000037f00a */
  96.         /*02d8*/                   IADD32I R4, R4, -0xfc ;                           /* 0x1c0ffffff0470404 */
  97.                                                                                      /* 0x001c7400fe0007f2 */
  98.         /*02e8*/                   LOP32I.OR R6, R11, 0x3f800000 ;                   /* 0x0423f80000070b06 */
  99.         /*02f0*/         {         SHL R10, R10, R5 ;                                /* 0x5c48000000570a0a */
  100.         /*02f8*/                   MUFU.RCP R7, R6         }
  101.                                                                                      /* 0x5080000000470607 */
  102.                                                                                      /* 0x381fc400fcc00ff6 */
        /* Correction term R8 = -(R6 * R7 + c[0x2][0x4]), then the corrected
           reciprocal is evaluated twice with different rounding modifiers:
             R9 = FFMA.RM(R7, R8, R7)
             R8 = FFMA.RP(R7, R8, R7)
           NOTE(review): .RM / .RP presumably round toward minus / plus infinity - confirm. */
  103.         /*0308*/                   FFMA R8, R6, R7, c[0x2][0x4] ;                    /* 0x5180038800170608 */
  104.         /*0310*/                   FADD.FTZ R8, -R8, -RZ ;                           /* 0x5c5930000ff70808 */
  105.         /*0318*/                   FFMA.RM R9, R7.reuse, R8.reuse, R7.reuse ;        /* 0x5988038000870709 */
  106.                                                                                      /* 0x001fd440fe2007f5 */
  107.         /*0328*/                   FFMA.RP R8, R7, R8, R7 ;                          /* 0x5990038000870708 */
        /* R7 = mantissa field of the .RM result. */
  108.         /*0330*/                   LOP32I.AND R7, R9.reuse, 0x7fffff ;               /* 0x040007fffff70907 */
        /* R8 = comparison result of (R9 not equal R8), i.e. whether the two
           roundings disagree (exact register encoding of "true" not shown here). */
  109.         /*0338*/                   FSET.NEU.FTZ.AND R8, R9, R8, PT ;                 /* 0x588d038000870908 */
  110.                                                                                      /* 0x001fc400fca007f1 */
        /* R7 gets bit 23 set (0x800000), giving a 24-bit significand.
           R8 is negated as an integer. R10 keeps the two masked bits of R7. */
  111.         /*0348*/                   LOP32I.OR R7, R7, 0x800000 ;                      /* 0x0420080000070707 */
  112.         /*0350*/                   IADD R8, -R8, RZ ;                                /* 0x5c1200000ff70808 */
  113.         /*0358*/                   LOP.AND R10, R10, R7 ;                            /* 0x5c47000000770a0a */
  114.                                                                                      /* 0x001fd800fe8407f1 */
        /* P1 = (R8 OR (R5 AND R7)) is nonzero, assuming the usual LOP3 truth-table
           convention where 0xf8 means a OR (b AND c) - TODO confirm.
           This reads R5 before it is overwritten at 0x378. */
  115.         /*0368*/                   LOP3.LUT.NZ P1, RZ, R8, R5.reuse, R7, 0xf8 ;      /* 0x5be103bf805708ff */
        /* R4 = significand shifted right by 1 or 2 (the result mantissa before rounding).
           R5 = the two masked bits moved down to bit positions 1 and 0. */
  116.         /*0370*/                   SHR.U32 R4, R7, R4 ;                              /* 0x5c28000000470704 */
  117.         /*0378*/                   SHR.U32 R5, R10, R5 ;                             /* 0x5c28000000570a05 */
  118.                                                                                      /* 0x001f8400fd8207f1 */
        /* Rounding decision:
             P2 = bit 1 of R5 set, P0 = bit 0 of R5 set
             P1 = P1 OR P2
             P0 = P0 AND P1, and when true the mantissa is incremented by 1.
           NOTE(review): this looks like a round-to-nearest-even decision - confirm. */
  119.         /*0388*/                   LOP.AND.NZ P2, RZ, R5.reuse, 0x2 ;                /* 0x38423000002705ff */
  120.         /*0390*/                   LOP.AND.NZ P0, RZ, R5, 0x1 ;                      /* 0x38403000001705ff */
  121.         /*0398*/                   PSETP.OR.AND P1, PT, P1, P2, PT ;                 /* 0x509003804107100f */
  122.                                                                                      /* 0x001ff400fda007ec */
        /* P2 is reused: true when the input mantissa field R11 is nonzero. */
  123.         /*03a8*/                   ISETP.NE.U32.AND P2, PT, R11, RZ, PT ;            /* 0x5b6a03800ff70b17 */
  124.         /*03b0*/                   PSETP.AND.AND P0, PT, P0, P1, PT ;                /* 0x5090038020070007 */
  125.         /*03b8*/               @P0 IADD32I R4, R4, 0x1 ;                             /* 0x1c00000000100404 */
  126.                                                                                      /* 0x001ffc00fe0007f6 */
        /* Input mantissa field was zero: double the result mantissa. */
  127.         /*03c8*/              @!P2 SHL R4, R4, 0x1 ;                                 /* 0x38480000001a0404 */
        /* R4 = R4 OR (c[0x2][0x8] AND R3), same 0xf8 truth table as above.
           NOTE(review): c[0x2][0x8] is presumably the sign mask 0x80000000, which
           would copy the sign of x into the result - confirm. */
  128.         /*03d0*/         {         LOP3.LUT R4, R4, c[0x2][0x8], R3, 0xf8 ;          /* 0x02f8018800270404 */
  129.         /*03d8*/                   RET         }
  130.                                                                                      /* 0xe32000000007000f */
  131.                                                                                      /* 0x001ffc01ffe0071d */
        /* Target 0x3e0: every remaining exponent value returns MUFU.RCP of the input. */
  132.         /*03e8*/                   MUFU.RCP R4, R3 ;                                 /* 0x5080000000470304 */
  133.         /*03f0*/                   RET ;                                             /* 0xe32000000007000f */
        /* Branch to itself, placed after the final RET
           (presumably end-of-code padding - TODO confirm). */
  134.         /*03f8*/                   BRA 0x3f8 ;                                       /* 0xe2400fffff87000f */
  135.                 ...........................
  136.  
  137.  

Editor

You can edit this paste and save as new:


File Description
  • SASS code using cuobjdump
  • Paste Code
  • 29 Dec-2020
  • 14.26 Kb
You can Share it: