1%def bindiv(result="", special="", rem=""): 2/* 3 * 32-bit binary div/rem operation. Handles special case of op0=minint and 4 * op1=-1. 5 */ 6 /* div/rem vAA, vBB, vCC */ 7 movzbl 2(rPC), %eax # eax <- BB 8 movzbl 3(rPC), %ecx # ecx <- CC 9 GET_VREG %eax, %eax # eax <- vBB 10 GET_VREG %ecx, %ecx # ecx <- vCC 11 mov rIBASE, LOCAL0(%esp) 12 testl %ecx, %ecx 13 je common_errDivideByZero 14 movl %eax, %edx 15 orl %ecx, %edx 16 testl $$0xFFFFFF00, %edx # If both arguments are less 17 # than 8-bit and +ve 18 jz .L${opcode}_8 # Do 8-bit divide 19 testl $$0xFFFF0000, %edx # If both arguments are less 20 # than 16-bit and +ve 21 jz .L${opcode}_16 # Do 16-bit divide 22 cmpl $$-1, %ecx 23 jne .L${opcode}_32 24 cmpl $$0x80000000, %eax 25 jne .L${opcode}_32 26 movl $special, $result 27 jmp .L${opcode}_finish 28% add_slow_path(bindiv_helper, result, rem) 29 30%def bindiv_helper(result, rem): 31.L${opcode}_32: 32 cltd 33 idivl %ecx 34 jmp .L${opcode}_finish 35.L${opcode}_8: 36 div %cl # 8-bit divide otherwise. 37 # Remainder in %ah, quotient in %al 38 .if $rem 39 movl %eax, %edx 40 shr $$8, %edx 41 .else 42 andl $$0x000000FF, %eax 43 .endif 44 jmp .L${opcode}_finish 45.L${opcode}_16: 46 xorl %edx, %edx # Clear %edx before divide 47 div %cx 48.L${opcode}_finish: 49 SET_VREG $result, rINST 50 mov LOCAL0(%esp), rIBASE 51 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 52 53%def bindiv2addr(result="", special=""): 54/* 55 * 32-bit binary div/rem operation. Handles special case of op0=minint and 56 * op1=-1. 57 */ 58 /* div/rem/2addr vA, vB */ 59 movzx rINSTbl, %ecx # eax <- BA 60 mov rIBASE, LOCAL0(%esp) 61 sarl $$4, %ecx # ecx <- B 62 GET_VREG %ecx, %ecx # eax <- vBB 63 andb $$0xf, rINSTbl # rINST <- A 64 GET_VREG %eax, rINST # eax <- vBB 65 testl %ecx, %ecx 66 je common_errDivideByZero 67 cmpl $$-1, %ecx 68 jne .L${opcode}_continue_div2addr 69 cmpl $$0x80000000, %eax 70 jne .L${opcode}_continue_div2addr 71 movl $special, $result 72 SET_VREG $result, rINST 73 mov LOCAL0(%esp), rIBASE 74 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 75% add_slow_path(bindiv2addr_helper, result) 76 77%def bindiv2addr_helper(result): 78.L${opcode}_continue_div2addr: 79 cltd 80 idivl %ecx 81 SET_VREG $result, rINST 82 mov LOCAL0(%esp), rIBASE 83 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 84 85%def bindivLit16(result="", special=""): 86/* 87 * 32-bit binary div/rem operation. Handles special case of op0=minint and 88 * op1=-1. 89 */ 90 /* div/rem/lit16 vA, vB, #+CCCC */ 91 /* Need A in rINST, ssssCCCC in ecx, vB in eax */ 92 movzbl rINSTbl, %eax # eax <- 000000BA 93 sarl $$4, %eax # eax <- B 94 GET_VREG %eax, %eax # eax <- vB 95 movswl 2(rPC), %ecx # ecx <- ssssCCCC 96 andb $$0xf, rINSTbl # rINST <- A 97 testl %ecx, %ecx 98 je common_errDivideByZero 99 cmpl $$-1, %ecx 100 jne .L${opcode}_continue_div 101 cmpl $$0x80000000, %eax 102 jne .L${opcode}_continue_div 103 movl $special, %eax 104 SET_VREG %eax, rINST 105 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 106 107.L${opcode}_continue_div: 108 mov rIBASE, LOCAL0(%esp) 109 cltd 110 idivl %ecx 111 SET_VREG $result, rINST 112 mov LOCAL0(%esp), rIBASE 113 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 114 115%def bindivLit8(result="", special=""): 116/* 117 * 32-bit div/rem "lit8" binary operation. Handles special case of 118 * op0=minint & op1=-1 119 */ 120 /* div/rem/lit8 vAA, vBB, #+CC */ 121 movzbl 2(rPC), %eax # eax <- BB 122 movsbl 3(rPC), %ecx # ecx <- ssssssCC 123 GET_VREG %eax, %eax # eax <- rBB 124 testl %ecx, %ecx 125 je common_errDivideByZero 126 cmpl $$0x80000000, %eax 127 jne .L${opcode}_continue_div 128 cmpl $$-1, %ecx 129 jne .L${opcode}_continue_div 130 movl $special, %eax 131 SET_VREG %eax, rINST 132 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 133 134.L${opcode}_continue_div: 135 mov rIBASE, LOCAL0(%esp) 136 cltd 137 idivl %ecx 138 SET_VREG $result, rINST 139 mov LOCAL0(%esp), rIBASE 140 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 141 142%def binop(result="%eax", instr=""): 143/* 144 * Generic 32-bit binary operation. Provide an "instr" line that 145 * specifies an instruction that performs "result = eax op VREG_ADDRESS(%ecx)". 146 * This could be an x86 instruction or a function call. (If the result 147 * comes back in a register other than eax, you can override "result".) 148 * 149 * For: add-int, sub-int, and-int, or-int, 150 * xor-int, shl-int, shr-int, ushr-int 151 */ 152 /* binop vAA, vBB, vCC */ 153 movzbl 2(rPC), %eax # eax <- BB 154 movzbl 3(rPC), %ecx # ecx <- CC 155 GET_VREG %eax, %eax # eax <- vBB 156 $instr VREG_ADDRESS(%ecx), %eax 157 SET_VREG $result, rINST 158 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 159 160%def binop1(result="%eax", tmp="%ecx", instr=""): 161/* 162 * Generic 32-bit binary operation in which both operands loaded to 163 * registers (op0 in eax, op1 in ecx). 164 */ 165 /* binop vAA, vBB, vCC */ 166 movzbl 2(rPC),%eax # eax <- BB 167 movzbl 3(rPC),%ecx # ecx <- CC 168 GET_VREG %eax, %eax # eax <- vBB 169 GET_VREG %ecx, %ecx # eax <- vBB 170 $instr # ex: addl %ecx,%eax 171 SET_VREG $result, rINST 172 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 173 174%def binop2addr(result="%eax", instr=""): 175/* 176 * Generic 32-bit "/2addr" binary operation. Provide an "instr" line 177 * that specifies an instruction that performs "result = r0 op r1". 178 * This could be an instruction or a function call. 179 * 180 * For: add-int/2addr, sub-int/2addr, mul-int/2addr, div-int/2addr, 181 * rem-int/2addr, and-int/2addr, or-int/2addr, xor-int/2addr, 182 * shl-int/2addr, shr-int/2addr, ushr-int/2addr, add-float/2addr, 183 * sub-float/2addr, mul-float/2addr, div-float/2addr, rem-float/2addr 184 */ 185 /* binop/2addr vA, vB */ 186 movzx rINSTbl, %ecx # ecx <- A+ 187 sarl $$4, rINST # rINST <- B 188 GET_VREG %eax, rINST # eax <- vB 189 andb $$0xf, %cl # ecx <- A 190 $instr %eax, VREG_ADDRESS(%ecx) 191 CLEAR_REF %ecx 192 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 193 194%def binopLit16(result="%eax", instr=""): 195/* 196 * Generic 32-bit "lit16" binary operation. Provide an "instr" line 197 * that specifies an instruction that performs "result = eax op ecx". 198 * This could be an x86 instruction or a function call. (If the result 199 * comes back in a register other than eax, you can override "result".) 200 * 201 * For: add-int/lit16, rsub-int, 202 * and-int/lit16, or-int/lit16, xor-int/lit16 203 */ 204 /* binop/lit16 vA, vB, #+CCCC */ 205 movzbl rINSTbl, %eax # eax <- 000000BA 206 sarl $$4, %eax # eax <- B 207 GET_VREG %eax, %eax # eax <- vB 208 movswl 2(rPC), %ecx # ecx <- ssssCCCC 209 andb $$0xf, rINSTbl # rINST <- A 210 $instr # for example: addl %ecx, %eax 211 SET_VREG $result, rINST 212 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 213 214%def binopLit8(result="%eax", instr=""): 215/* 216 * Generic 32-bit "lit8" binary operation. Provide an "instr" line 217 * that specifies an instruction that performs "result = eax op ecx". 218 * This could be an x86 instruction or a function call. (If the result 219 * comes back in a register other than r0, you can override "result".) 220 * 221 * For: add-int/lit8, rsub-int/lit8 222 * and-int/lit8, or-int/lit8, xor-int/lit8, 223 * shl-int/lit8, shr-int/lit8, ushr-int/lit8 224 */ 225 /* binop/lit8 vAA, vBB, #+CC */ 226 movzbl 2(rPC), %eax # eax <- BB 227 movsbl 3(rPC), %ecx # ecx <- ssssssCC 228 GET_VREG %eax, %eax # eax <- rBB 229 $instr # ex: addl %ecx,%eax 230 SET_VREG $result, rINST 231 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 232 233%def binopWide(instr1="", instr2=""): 234/* 235 * Generic 64-bit binary operation. 236 */ 237 /* binop vAA, vBB, vCC */ 238 movzbl 2(rPC), %eax # eax <- BB 239 movzbl 3(rPC), %ecx # ecx <- CC 240 movl rIBASE, LOCAL0(%esp) # save rIBASE 241 GET_VREG rIBASE, %eax # rIBASE <- v[BB+0] 242 GET_VREG_HIGH %eax, %eax # eax <- v[BB+1] 243 $instr1 VREG_ADDRESS(%ecx), rIBASE 244 $instr2 VREG_HIGH_ADDRESS(%ecx), %eax 245 SET_VREG rIBASE, rINST # v[AA+0] <- rIBASE 246 movl LOCAL0(%esp), rIBASE # restore rIBASE 247 SET_VREG_HIGH %eax, rINST # v[AA+1] <- eax 248 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 249 250%def binopWide2addr(instr1="", instr2=""): 251/* 252 * Generic 64-bit binary operation. 253 */ 254 /* binop/2addr vA, vB */ 255 movzbl rINSTbl, %ecx # ecx<- BA 256 sarl $$4, %ecx # ecx<- B 257 GET_VREG %eax, %ecx # eax<- v[B+0] 258 GET_VREG_HIGH %ecx, %ecx # eax<- v[B+1] 259 andb $$0xF, rINSTbl # rINST<- A 260 $instr1 %eax, VREG_ADDRESS(rINST) 261 $instr2 %ecx, VREG_HIGH_ADDRESS(rINST) 262 CLEAR_WIDE_REF rINST 263 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 264 265%def cvtfp_int(srcdouble="1", tgtlong="1"): 266/* On fp to int conversions, Java requires that 267 * if the result > maxint, it should be clamped to maxint. If it is less 268 * than minint, it should be clamped to minint. If it is a nan, the result 269 * should be zero. Further, the rounding mode is to truncate. This model 270 * differs from what is delivered normally via the x86 fpu, so we have 271 * to play some games. 272 */ 273 /* float/double to int/long vA, vB */ 274 movzbl rINSTbl, %ecx # ecx <- A+ 275 sarl $$4, rINST # rINST <- B 276 .if $srcdouble 277 fldl VREG_ADDRESS(rINST) # %st0 <- vB 278 .else 279 flds VREG_ADDRESS(rINST) # %st0 <- vB 280 .endif 281 ftst 282 fnstcw LOCAL0(%esp) # remember original rounding mode 283 movzwl LOCAL0(%esp), %eax 284 movb $$0xc, %ah 285 movw %ax, LOCAL0+2(%esp) 286 fldcw LOCAL0+2(%esp) # set "to zero" rounding mode 287 andb $$0xf, %cl # ecx <- A 288 .if $tgtlong 289 fistpll VREG_ADDRESS(%ecx) # convert and store 290 .else 291 fistpl VREG_ADDRESS(%ecx) # convert and store 292 .endif 293 fldcw LOCAL0(%esp) # restore previous rounding mode 294 .if $tgtlong 295 movl $$0x80000000, %eax 296 xorl VREG_HIGH_ADDRESS(%ecx), %eax 297 orl VREG_ADDRESS(%ecx), %eax 298 .else 299 cmpl $$0x80000000, VREG_ADDRESS(%ecx) 300 .endif 301 je .L${opcode}_special_case # fix up result 302 303.L${opcode}_finish: 304 xor %eax, %eax 305 mov %eax, VREG_REF_ADDRESS(%ecx) 306 .if $tgtlong 307 mov %eax, VREG_REF_HIGH_ADDRESS(%ecx) 308 .endif 309 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 310% add_slow_path(cvtfp_int_helper, tgtlong) 311 312%def cvtfp_int_helper(tgtlong): 313.L${opcode}_special_case: 314 fnstsw %ax 315 sahf 316 jp .L${opcode}_isNaN 317 adcl $$-1, VREG_ADDRESS(%ecx) 318 .if $tgtlong 319 adcl $$-1, VREG_HIGH_ADDRESS(%ecx) 320 .endif 321 jmp .L${opcode}_finish 322.L${opcode}_isNaN: 323 movl $$0, VREG_ADDRESS(%ecx) 324 .if $tgtlong 325 movl $$0, VREG_HIGH_ADDRESS(%ecx) 326 .endif 327 jmp .L${opcode}_finish 328 329%def shop2addr(result="%eax", instr=""): 330/* 331 * Generic 32-bit "shift/2addr" operation. 332 */ 333 /* shift/2addr vA, vB */ 334 movzx rINSTbl, %ecx # eax <- BA 335 sarl $$4, %ecx # ecx <- B 336 GET_VREG %ecx, %ecx # eax <- vBB 337 andb $$0xf, rINSTbl # rINST <- A 338 GET_VREG %eax, rINST # eax <- vAA 339 $instr # ex: sarl %cl, %eax 340 SET_VREG $result, rINST 341 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 342 343%def unop(instr=""): 344/* 345 * Generic 32-bit unary operation. Provide an "instr" line that 346 * specifies an instruction that performs "result = op eax". 347 */ 348 /* unop vA, vB */ 349 movzbl rINSTbl,%ecx # ecx <- A+ 350 sarl $$4,rINST # rINST <- B 351 GET_VREG %eax, rINST # eax <- vB 352 andb $$0xf,%cl # ecx <- A 353 $instr 354 SET_VREG %eax, %ecx 355 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 356 357%def op_add_int(): 358% binop(instr="addl") 359 360%def op_add_int_2addr(): 361% binop2addr(instr="addl") 362 363%def op_add_int_lit16(): 364% binopLit16(instr="addl %ecx, %eax") 365 366%def op_add_int_lit8(): 367% binopLit8(instr="addl %ecx, %eax") 368 369%def op_add_long(): 370% binopWide(instr1="addl", instr2="adcl") 371 372%def op_add_long_2addr(): 373% binopWide2addr(instr1="addl", instr2="adcl") 374 375%def op_and_int(): 376% binop(instr="andl") 377 378%def op_and_int_2addr(): 379% binop2addr(instr="andl") 380 381%def op_and_int_lit16(): 382% binopLit16(instr="andl %ecx, %eax") 383 384%def op_and_int_lit8(): 385% binopLit8(instr="andl %ecx, %eax") 386 387%def op_and_long(): 388% binopWide(instr1="andl", instr2="andl") 389 390%def op_and_long_2addr(): 391% binopWide2addr(instr1="andl", instr2="andl") 392 393%def op_cmp_long(): 394/* 395 * Compare two 64-bit values. Puts 0, 1, or -1 into the destination 396 * register based on the results of the comparison. 397 */ 398 /* cmp-long vAA, vBB, vCC */ 399 movzbl 2(rPC), %eax # eax <- BB 400 movzbl 3(rPC), %ecx # ecx <- CC 401 GET_VREG_HIGH %eax, %eax # eax <- v[BB+1], BB is clobbered 402 cmpl VREG_HIGH_ADDRESS(%ecx), %eax 403 jl .L${opcode}_smaller 404 jg .L${opcode}_bigger 405 movzbl 2(rPC), %eax # eax <- BB, restore BB 406 GET_VREG %eax, %eax # eax <- v[BB] 407 sub VREG_ADDRESS(%ecx), %eax 408 ja .L${opcode}_bigger 409 jb .L${opcode}_smaller 410.L${opcode}_finish: 411 SET_VREG %eax, rINST 412 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 413 414.L${opcode}_bigger: 415 movl $$1, %eax 416 jmp .L${opcode}_finish 417 418.L${opcode}_smaller: 419 movl $$-1, %eax 420 jmp .L${opcode}_finish 421 422%def op_div_int(): 423% bindiv(result="%eax", special="$0x80000000", rem="0") 424 425%def op_div_int_2addr(): 426% bindiv2addr(result="%eax", special="$0x80000000") 427 428%def op_div_int_lit16(): 429% bindivLit16(result="%eax", special="$0x80000000") 430 431%def op_div_int_lit8(): 432% bindivLit8(result="%eax", special="$0x80000000") 433 434%def op_div_long(routine="art_quick_ldiv"): 435/* art_quick_* methods has quick abi, 436 * so use eax, ecx, edx, ebx for args 437 */ 438 /* div vAA, vBB, vCC */ 439 .extern $routine 440 mov rIBASE, LOCAL0(%esp) # save rIBASE/%edx 441 mov rINST, LOCAL1(%esp) # save rINST/%ebx 442 movzbl 3(rPC), %eax # eax <- CC 443 GET_VREG %ecx, %eax 444 GET_VREG_HIGH %ebx, %eax 445 movl %ecx, %edx 446 orl %ebx, %ecx 447 jz common_errDivideByZero 448 movzbl 2(rPC), %eax # eax <- BB 449 GET_VREG_HIGH %ecx, %eax 450 GET_VREG %eax, %eax 451 call SYMBOL($routine) 452 mov LOCAL1(%esp), rINST # restore rINST/%ebx 453 SET_VREG_HIGH rIBASE, rINST 454 SET_VREG %eax, rINST 455 mov LOCAL0(%esp), rIBASE # restore rIBASE/%edx 456 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 457 458%def op_div_long_2addr(routine="art_quick_ldiv"): 459/* art_quick_* methods has quick abi, 460 * so use eax, ecx, edx, ebx for args 461 */ 462 /* div/2addr vA, vB */ 463 .extern $routine 464 mov rIBASE, LOCAL0(%esp) # save rIBASE/%edx 465 movzbl rINSTbl, %eax 466 shrl $$4, %eax # eax <- B 467 andb $$0xf, rINSTbl # rINST <- A 468 mov rINST, LOCAL1(%esp) # save rINST/%ebx 469 movl %ebx, %ecx 470 GET_VREG %edx, %eax 471 GET_VREG_HIGH %ebx, %eax 472 movl %edx, %eax 473 orl %ebx, %eax 474 jz common_errDivideByZero 475 GET_VREG %eax, %ecx 476 GET_VREG_HIGH %ecx, %ecx 477 call SYMBOL($routine) 478 mov LOCAL1(%esp), rINST # restore rINST/%ebx 479 SET_VREG_HIGH rIBASE, rINST 480 SET_VREG %eax, rINST 481 mov LOCAL0(%esp), rIBASE # restore rIBASE/%edx 482 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 483 484%def op_int_to_byte(): 485% unop(instr="movsbl %al, %eax") 486 487%def op_int_to_char(): 488% unop(instr="movzwl %ax,%eax") 489 490%def op_int_to_long(): 491 /* int to long vA, vB */ 492 movzbl rINSTbl, %eax # eax <- +A 493 sarl $$4, %eax # eax <- B 494 GET_VREG %eax, %eax # eax <- vB 495 andb $$0xf, rINSTbl # rINST <- A 496 movl rIBASE, %ecx # cltd trashes rIBASE/edx 497 cltd # rINST:eax<- sssssssBBBBBBBB 498 SET_VREG_HIGH rIBASE, rINST # v[A+1] <- rIBASE 499 SET_VREG %eax, rINST # v[A+0] <- %eax 500 movl %ecx, rIBASE 501 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 502 503 504%def op_int_to_short(): 505% unop(instr="movswl %ax, %eax") 506 507%def op_long_to_int(): 508/* we ignore the high word, making this equivalent to a 32-bit reg move */ 509% op_move() 510 511%def op_mul_int(): 512 /* 513 * 32-bit binary multiplication. 514 */ 515 /* mul vAA, vBB, vCC */ 516 movzbl 2(rPC), %eax # eax <- BB 517 movzbl 3(rPC), %ecx # ecx <- CC 518 GET_VREG %eax, %eax # eax <- vBB 519 mov rIBASE, LOCAL0(%esp) 520 imull VREG_ADDRESS(%ecx), %eax # trashes rIBASE/edx 521 mov LOCAL0(%esp), rIBASE 522 SET_VREG %eax, rINST 523 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 524 525%def op_mul_int_2addr(): 526 /* mul vA, vB */ 527 movzx rINSTbl, %ecx # ecx <- A+ 528 sarl $$4, rINST # rINST <- B 529 GET_VREG %eax, rINST # eax <- vB 530 andb $$0xf, %cl # ecx <- A 531 movl rIBASE, rINST 532 imull VREG_ADDRESS(%ecx), %eax # trashes rIBASE/edx 533 movl rINST, rIBASE 534 SET_VREG %eax, %ecx 535 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 536 537%def op_mul_int_lit16(): 538 /* mul/lit16 vA, vB, #+CCCC */ 539 /* Need A in rINST, ssssCCCC in ecx, vB in eax */ 540 movzbl rINSTbl, %eax # eax <- 000000BA 541 sarl $$4, %eax # eax <- B 542 GET_VREG %eax, %eax # eax <- vB 543 movl rIBASE, %ecx 544 movswl 2(rPC), rIBASE # rIBASE <- ssssCCCC 545 andb $$0xf, rINSTbl # rINST <- A 546 imull rIBASE, %eax # trashes rIBASE/edx 547 movl %ecx, rIBASE 548 SET_VREG %eax, rINST 549 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 550 551%def op_mul_int_lit8(): 552 /* mul/lit8 vAA, vBB, #+CC */ 553 movzbl 2(rPC), %eax # eax <- BB 554 movl rIBASE, %ecx 555 GET_VREG %eax, %eax # eax <- rBB 556 movsbl 3(rPC), rIBASE # rIBASE <- ssssssCC 557 imull rIBASE, %eax # trashes rIBASE/edx 558 movl %ecx, rIBASE 559 SET_VREG %eax, rINST 560 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 561 562%def op_mul_long(): 563/* 564 * Signed 64-bit integer multiply. 565 * 566 * We could definately use more free registers for 567 * this code. We spill rINSTw (ebx), 568 * giving us eax, ebc, ecx and edx as computational 569 * temps. On top of that, we'll spill edi (rFP) 570 * for use as the vB pointer and esi (rPC) for use 571 * as the vC pointer. Yuck. 572 * 573 */ 574 /* mul-long vAA, vBB, vCC */ 575 movzbl 2(rPC), %eax # eax <- B 576 movzbl 3(rPC), %ecx # ecx <- C 577 mov rPC, LOCAL0(%esp) # save Interpreter PC 578 mov rFP, LOCAL1(%esp) # save FP 579 mov rIBASE, LOCAL2(%esp) # save rIBASE 580 leal (rFP,%eax,4), %esi # esi <- &v[B] 581 leal VREG_ADDRESS(%ecx), rFP # rFP <- &v[C] 582 movl 4(%esi), %ecx # ecx <- Bmsw 583 imull (rFP), %ecx # ecx <- (Bmsw*Clsw) 584 movl 4(rFP), %eax # eax <- Cmsw 585 imull (%esi), %eax # eax <- (Cmsw*Blsw) 586 addl %eax, %ecx # ecx <- (Bmsw*Clsw)+(Cmsw*Blsw) 587 movl (rFP), %eax # eax <- Clsw 588 mull (%esi) # eax <- (Clsw*Alsw) 589 mov LOCAL0(%esp), rPC # restore Interpreter PC 590 mov LOCAL1(%esp), rFP # restore FP 591 leal (%ecx,rIBASE), rIBASE # full result now in rIBASE:%eax 592 SET_VREG_HIGH rIBASE, rINST # v[B+1] <- rIBASE 593 mov LOCAL2(%esp), rIBASE # restore IBASE 594 SET_VREG %eax, rINST # v[B] <- eax 595 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 596 597%def op_mul_long_2addr(): 598/* 599 * Signed 64-bit integer multiply, 2-addr version 600 * 601 * We could definately use more free registers for 602 * this code. We must spill %edx (rIBASE) because it 603 * is used by imul. We'll also spill rINST (ebx), 604 * giving us eax, ebc, ecx and rIBASE as computational 605 * temps. On top of that, we'll spill %esi (edi) 606 * for use as the vA pointer and rFP (esi) for use 607 * as the vB pointer. Yuck. 608 */ 609 /* mul-long/2addr vA, vB */ 610 movzbl rINSTbl, %eax # eax <- BA 611 andb $$0xf, %al # eax <- A 612 CLEAR_WIDE_REF %eax # clear refs in advance 613 sarl $$4, rINST # rINST <- B 614 mov rPC, LOCAL0(%esp) # save Interpreter PC 615 mov rFP, LOCAL1(%esp) # save FP 616 mov rIBASE, LOCAL2(%esp) # save rIBASE 617 leal (rFP,%eax,4), %esi # esi <- &v[A] 618 leal (rFP,rINST,4), rFP # rFP <- &v[B] 619 movl 4(%esi), %ecx # ecx <- Amsw 620 imull (rFP), %ecx # ecx <- (Amsw*Blsw) 621 movl 4(rFP), %eax # eax <- Bmsw 622 imull (%esi), %eax # eax <- (Bmsw*Alsw) 623 addl %eax, %ecx # ecx <- (Amsw*Blsw)+(Bmsw*Alsw) 624 movl (rFP), %eax # eax <- Blsw 625 mull (%esi) # eax <- (Blsw*Alsw) 626 leal (%ecx,rIBASE), rIBASE # full result now in %edx:%eax 627 movl rIBASE, 4(%esi) # v[A+1] <- rIBASE 628 movl %eax, (%esi) # v[A] <- %eax 629 mov LOCAL0(%esp), rPC # restore Interpreter PC 630 mov LOCAL2(%esp), rIBASE # restore IBASE 631 mov LOCAL1(%esp), rFP # restore FP 632 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 633 634%def op_neg_int(): 635% unop(instr="negl %eax") 636 637%def op_neg_long(): 638 /* unop vA, vB */ 639 movzbl rINSTbl, %ecx # ecx <- BA 640 sarl $$4, %ecx # ecx <- B 641 andb $$0xf, rINSTbl # rINST <- A 642 GET_VREG %eax, %ecx # eax <- v[B+0] 643 GET_VREG_HIGH %ecx, %ecx # ecx <- v[B+1] 644 negl %eax 645 adcl $$0, %ecx 646 negl %ecx 647 SET_VREG %eax, rINST # v[A+0] <- eax 648 SET_VREG_HIGH %ecx, rINST # v[A+1] <- ecx 649 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 650 651 652%def op_not_int(): 653% unop(instr="notl %eax") 654 655%def op_not_long(): 656 /* unop vA, vB */ 657 movzbl rINSTbl, %ecx # ecx <- BA 658 sarl $$4, %ecx # ecx <- B 659 andb $$0xf, rINSTbl # rINST <- A 660 GET_VREG %eax, %ecx # eax <- v[B+0] 661 GET_VREG_HIGH %ecx, %ecx # ecx <- v[B+1] 662 notl %eax 663 notl %ecx 664 SET_VREG %eax, rINST # v[A+0] <- eax 665 SET_VREG_HIGH %ecx, rINST # v[A+1] <- ecx 666 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 667 668%def op_or_int(): 669% binop(instr="orl") 670 671%def op_or_int_2addr(): 672% binop2addr(instr="orl") 673 674%def op_or_int_lit16(): 675% binopLit16(instr="orl %ecx, %eax") 676 677%def op_or_int_lit8(): 678% binopLit8(instr="orl %ecx, %eax") 679 680%def op_or_long(): 681% binopWide(instr1="orl", instr2="orl") 682 683%def op_or_long_2addr(): 684% binopWide2addr(instr1="orl", instr2="orl") 685 686%def op_rem_int(): 687% bindiv(result="rIBASE", special="$0", rem="1") 688 689%def op_rem_int_2addr(): 690% bindiv2addr(result="rIBASE", special="$0") 691 692%def op_rem_int_lit16(): 693% bindivLit16(result="rIBASE", special="$0") 694 695%def op_rem_int_lit8(): 696% bindivLit8(result="rIBASE", special="$0") 697 698%def op_rem_long(): 699% op_div_long(routine="art_quick_lmod") 700 701%def op_rem_long_2addr(): 702% op_div_long_2addr(routine="art_quick_lmod") 703 704%def op_rsub_int(): 705/* this op is "rsub-int", but can be thought of as "rsub-int/lit16" */ 706% binopLit16(instr="subl %eax, %ecx", result="%ecx") 707 708%def op_rsub_int_lit8(): 709% binopLit8(instr="subl %eax, %ecx", result="%ecx") 710 711%def op_shl_int(): 712% binop1(instr="sall %cl, %eax") 713 714%def op_shl_int_2addr(): 715% shop2addr(instr="sall %cl, %eax") 716 717%def op_shl_int_lit8(): 718% binopLit8(instr="sall %cl, %eax") 719 720%def op_shl_long(): 721/* 722 * Long integer shift. This is different from the generic 32/64-bit 723 * binary operations because vAA/vBB are 64-bit but vCC (the shift 724 * distance) is 32-bit. Also, Dalvik requires us to mask off the low 725 * 6 bits of the shift distance. x86 shifts automatically mask off 726 * the low 5 bits of %cl, so have to handle the 64 > shiftcount > 31 727 * case specially. 728 */ 729 /* shl-long vAA, vBB, vCC */ 730 /* ecx gets shift count */ 731 /* Need to spill rINST */ 732 /* rINSTw gets AA */ 733 movzbl 2(rPC), %eax # eax <- BB 734 movzbl 3(rPC), %ecx # ecx <- CC 735 movl rIBASE, LOCAL0(%esp) 736 GET_VREG_HIGH rIBASE, %eax # ecx <- v[BB+1] 737 GET_VREG %ecx, %ecx # ecx <- vCC 738 GET_VREG %eax, %eax # eax <- v[BB+0] 739 shldl %eax,rIBASE 740 sall %cl, %eax 741 testb $$32, %cl 742 je 2f 743 movl %eax, rIBASE 744 xorl %eax, %eax 7452: 746 SET_VREG_HIGH rIBASE, rINST # v[AA+1] <- rIBASE 747 movl LOCAL0(%esp), rIBASE 748 SET_VREG %eax, rINST # v[AA+0] <- %eax 749 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 750 751%def op_shl_long_2addr(): 752/* 753 * Long integer shift, 2addr version. vA is 64-bit value/result, vB is 754 * 32-bit shift distance. 755 */ 756 /* shl-long/2addr vA, vB */ 757 /* ecx gets shift count */ 758 /* Need to spill rIBASE */ 759 /* rINSTw gets AA */ 760 movzbl rINSTbl, %ecx # ecx <- BA 761 andb $$0xf, rINSTbl # rINST <- A 762 GET_VREG %eax, rINST # eax <- v[AA+0] 763 sarl $$4, %ecx # ecx <- B 764 movl rIBASE, LOCAL0(%esp) 765 GET_VREG_HIGH rIBASE, rINST # rIBASE <- v[AA+1] 766 GET_VREG %ecx, %ecx # ecx <- vBB 767 shldl %eax, rIBASE 768 sall %cl, %eax 769 testb $$32, %cl 770 je 2f 771 movl %eax, rIBASE 772 xorl %eax, %eax 7732: 774 SET_VREG_HIGH rIBASE, rINST # v[AA+1] <- rIBASE 775 movl LOCAL0(%esp), rIBASE 776 SET_VREG %eax, rINST # v[AA+0] <- eax 777 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 778 779%def op_shr_int(): 780% binop1(instr="sarl %cl, %eax") 781 782%def op_shr_int_2addr(): 783% shop2addr(instr="sarl %cl, %eax") 784 785%def op_shr_int_lit8(): 786% binopLit8(instr="sarl %cl, %eax") 787 788%def op_shr_long(): 789/* 790 * Long integer shift. This is different from the generic 32/64-bit 791 * binary operations because vAA/vBB are 64-bit but vCC (the shift 792 * distance) is 32-bit. Also, Dalvik requires us to mask off the low 793 * 6 bits of the shift distance. x86 shifts automatically mask off 794 * the low 5 bits of %cl, so have to handle the 64 > shiftcount > 31 795 * case specially. 796 */ 797 /* shr-long vAA, vBB, vCC */ 798 /* ecx gets shift count */ 799 /* Need to spill rIBASE */ 800 /* rINSTw gets AA */ 801 movzbl 2(rPC), %eax # eax <- BB 802 movzbl 3(rPC), %ecx # ecx <- CC 803 movl rIBASE, LOCAL0(%esp) 804 GET_VREG_HIGH rIBASE, %eax # rIBASE<- v[BB+1] 805 GET_VREG %ecx, %ecx # ecx <- vCC 806 GET_VREG %eax, %eax # eax <- v[BB+0] 807 shrdl rIBASE, %eax 808 sarl %cl, rIBASE 809 testb $$32, %cl 810 je 2f 811 movl rIBASE, %eax 812 sarl $$31, rIBASE 8132: 814 SET_VREG_HIGH rIBASE, rINST # v[AA+1] <- rIBASE 815 movl LOCAL0(%esp), rIBASE 816 SET_VREG %eax, rINST # v[AA+0] <- eax 817 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 818 819%def op_shr_long_2addr(): 820/* 821 * Long integer shift, 2addr version. vA is 64-bit value/result, vB is 822 * 32-bit shift distance. 823 */ 824 /* shl-long/2addr vA, vB */ 825 /* ecx gets shift count */ 826 /* Need to spill rIBASE */ 827 /* rINSTw gets AA */ 828 movzbl rINSTbl, %ecx # ecx <- BA 829 andb $$0xf, rINSTbl # rINST <- A 830 GET_VREG %eax, rINST # eax <- v[AA+0] 831 sarl $$4, %ecx # ecx <- B 832 movl rIBASE, LOCAL0(%esp) 833 GET_VREG_HIGH rIBASE, rINST # rIBASE <- v[AA+1] 834 GET_VREG %ecx, %ecx # ecx <- vBB 835 shrdl rIBASE, %eax 836 sarl %cl, rIBASE 837 testb $$32, %cl 838 je 2f 839 movl rIBASE, %eax 840 sarl $$31, rIBASE 8412: 842 SET_VREG_HIGH rIBASE, rINST # v[AA+1] <- rIBASE 843 movl LOCAL0(%esp), rIBASE 844 SET_VREG %eax, rINST # v[AA+0] <- eax 845 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 846 847%def op_sub_int(): 848% binop(instr="subl") 849 850%def op_sub_int_2addr(): 851% binop2addr(instr="subl") 852 853%def op_sub_long(): 854% binopWide(instr1="subl", instr2="sbbl") 855 856%def op_sub_long_2addr(): 857% binopWide2addr(instr1="subl", instr2="sbbl") 858 859%def op_ushr_int(): 860% binop1(instr="shrl %cl, %eax") 861 862%def op_ushr_int_2addr(): 863% shop2addr(instr="shrl %cl, %eax") 864 865%def op_ushr_int_lit8(): 866% binopLit8(instr="shrl %cl, %eax") 867 868%def op_ushr_long(): 869/* 870 * Long integer shift. This is different from the generic 32/64-bit 871 * binary operations because vAA/vBB are 64-bit but vCC (the shift 872 * distance) is 32-bit. Also, Dalvik requires us to mask off the low 873 * 6 bits of the shift distance. x86 shifts automatically mask off 874 * the low 5 bits of %cl, so have to handle the 64 > shiftcount > 31 875 * case specially. 876 */ 877 /* shr-long vAA, vBB, vCC */ 878 /* ecx gets shift count */ 879 /* Need to spill rIBASE */ 880 /* rINSTw gets AA */ 881 movzbl 2(rPC), %eax # eax <- BB 882 movzbl 3(rPC), %ecx # ecx <- CC 883 movl rIBASE, LOCAL0(%esp) 884 GET_VREG_HIGH rIBASE, %eax # rIBASE <- v[BB+1] 885 GET_VREG %ecx, %ecx # ecx <- vCC 886 GET_VREG %eax, %eax # eax <- v[BB+0] 887 shrdl rIBASE, %eax 888 shrl %cl, rIBASE 889 testb $$32, %cl 890 je 2f 891 movl rIBASE, %eax 892 xorl rIBASE, rIBASE 8932: 894 SET_VREG_HIGH rIBASE, rINST # v[AA+1] <- rIBASE 895 movl LOCAL0(%esp), rIBASE 896 SET_VREG %eax, rINST # v[BB+0] <- eax 897 ADVANCE_PC_FETCH_AND_GOTO_NEXT 2 898 899%def op_ushr_long_2addr(): 900/* 901 * Long integer shift, 2addr version. vA is 64-bit value/result, vB is 902 * 32-bit shift distance. 903 */ 904 /* shl-long/2addr vA, vB */ 905 /* ecx gets shift count */ 906 /* Need to spill rIBASE */ 907 /* rINSTw gets AA */ 908 movzbl rINSTbl, %ecx # ecx <- BA 909 andb $$0xf, rINSTbl # rINST <- A 910 GET_VREG %eax, rINST # eax <- v[AA+0] 911 sarl $$4, %ecx # ecx <- B 912 movl rIBASE, LOCAL0(%esp) 913 GET_VREG_HIGH rIBASE, rINST # rIBASE <- v[AA+1] 914 GET_VREG %ecx, %ecx # ecx <- vBB 915 shrdl rIBASE, %eax 916 shrl %cl, rIBASE 917 testb $$32, %cl 918 je 2f 919 movl rIBASE, %eax 920 xorl rIBASE, rIBASE 9212: 922 SET_VREG_HIGH rIBASE, rINST # v[AA+1] <- rIBASE 923 movl LOCAL0(%esp), rIBASE 924 SET_VREG %eax, rINST # v[AA+0] <- eax 925 ADVANCE_PC_FETCH_AND_GOTO_NEXT 1 926 927%def op_xor_int(): 928% binop(instr="xorl") 929 930%def op_xor_int_2addr(): 931% binop2addr(instr="xorl") 932 933%def op_xor_int_lit16(): 934% binopLit16(instr="xorl %ecx, %eax") 935 936%def op_xor_int_lit8(): 937% binopLit8(instr="xorl %ecx, %eax") 938 939%def op_xor_long(): 940% binopWide(instr1="xorl", instr2="xorl") 941 942%def op_xor_long_2addr(): 943% binopWide2addr(instr1="xorl", instr2="xorl") 944