CoCalc -- assembler

GitHub Repository: PojavLauncherTeam/openjdk-aarch32-jdk8u
Path: blob/jdk8u272-b10-aarch32-20201026/hotspot/src/cpu/x86/vm/assembler_x86.cpp
⁴⁸⁷⁸⁵ views
1
/*
2
 * Copyright (c) 1997, 2014, Oracle and/or its affiliates. All rights reserved.
3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4
 *
5
 * This code is free software; you can redistribute it and/or modify it
6
 * under the terms of the GNU General Public License version 2 only, as
7
 * published by the Free Software Foundation.
8
 *
9
 * This code is distributed in the hope that it will be useful, but WITHOUT
10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
12
 * version 2 for more details (a copy is included in the LICENSE file that
13
 * accompanied this code).
14
 *
15
 * You should have received a copy of the GNU General Public License version
16
 * 2 along with this work; if not, write to the Free Software Foundation,
17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18
 *
19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
20
 * or visit www.oracle.com if you need additional information or have any
21
 * questions.
22
 *
23
 */
24

25
#include "precompiled.hpp"
26
#include "asm/assembler.hpp"
27
#include "asm/assembler.inline.hpp"
28
#include "gc_interface/collectedHeap.inline.hpp"
29
#include "interpreter/interpreter.hpp"
30
#include "memory/cardTableModRefBS.hpp"
31
#include "memory/resourceArea.hpp"
32
#include "prims/methodHandles.hpp"
33
#include "runtime/biasedLocking.hpp"
34
#include "runtime/interfaceSupport.hpp"
35
#include "runtime/objectMonitor.hpp"
36
#include "runtime/os.hpp"
37
#include "runtime/sharedRuntime.hpp"
38
#include "runtime/stubRoutines.hpp"
39
#include "utilities/macros.hpp"
40
#if INCLUDE_ALL_GCS
41
#include "gc_implementation/g1/g1CollectedHeap.inline.hpp"
42
#include "gc_implementation/g1/g1SATBCardTableModRefBS.hpp"
43
#include "gc_implementation/g1/heapRegion.hpp"
44
#endif // INCLUDE_ALL_GCS
45

46
#ifdef PRODUCT
47
#define BLOCK_COMMENT(str) /* nothing */
48
#define STOP(error) stop(error)
49
#else
50
#define BLOCK_COMMENT(str) block_comment(str)
51
#define STOP(error) block_comment(error); stop(error)
52
#endif
53

54
#define BIND(label) bind(label); BLOCK_COMMENT(#label ":")
55
// Implementation of AddressLiteral
56

57
AddressLiteral::AddressLiteral(address target, relocInfo::relocType rtype) {
58
  _is_lval = false;
59
  _target = target;
60
  switch (rtype) {
61
  case relocInfo::oop_type:
62
  case relocInfo::metadata_type:
63
    // Oops are a special case. Normally they would be their own section
64
    // but in cases like icBuffer they are literals in the code stream that
65
    // we don't have a section for. We use none so that we get a literal address
66
    // which is always patchable.
67
    break;
68
  case relocInfo::external_word_type:
69
    _rspec = external_word_Relocation::spec(target);
70
    break;
71
  case relocInfo::internal_word_type:
72
    _rspec = internal_word_Relocation::spec(target);
73
    break;
74
  case relocInfo::opt_virtual_call_type:
75
    _rspec = opt_virtual_call_Relocation::spec();
76
    break;
77
  case relocInfo::static_call_type:
78
    _rspec = static_call_Relocation::spec();
79
    break;
80
  case relocInfo::runtime_call_type:
81
    _rspec = runtime_call_Relocation::spec();
82
    break;
83
  case relocInfo::poll_type:
84
  case relocInfo::poll_return_type:
85
    _rspec = Relocation::spec_simple(rtype);
86
    break;
87
  case relocInfo::none:
88
    break;
89
  default:
90
    ShouldNotReachHere();
91
    break;
92
  }
93
}
94

95
// Implementation of Address
96

97
#ifdef _LP64
98

99
Address Address::make_array(ArrayAddress adr) {
100
  // Not implementable on 64bit machines
101
  // Should have been handled higher up the call chain.
102
  ShouldNotReachHere();
103
  return Address();
104
}
105

106
// exceedingly dangerous constructor
107
Address::Address(int disp, address loc, relocInfo::relocType rtype) {
108
  _base  = noreg;
109
  _index = noreg;
110
  _scale = no_scale;
111
  _disp  = disp;
112
  switch (rtype) {
113
    case relocInfo::external_word_type:
114
      _rspec = external_word_Relocation::spec(loc);
115
      break;
116
    case relocInfo::internal_word_type:
117
      _rspec = internal_word_Relocation::spec(loc);
118
      break;
119
    case relocInfo::runtime_call_type:
120
      // HMM
121
      _rspec = runtime_call_Relocation::spec();
122
      break;
123
    case relocInfo::poll_type:
124
    case relocInfo::poll_return_type:
125
      _rspec = Relocation::spec_simple(rtype);
126
      break;
127
    case relocInfo::none:
128
      break;
129
    default:
130
      ShouldNotReachHere();
131
  }
132
}
133
#else // LP64
134

135
Address Address::make_array(ArrayAddress adr) {
136
  AddressLiteral base = adr.base();
137
  Address index = adr.index();
138
  assert(index._disp == 0, "must not have disp"); // maybe it can?
139
  Address array(index._base, index._index, index._scale, (intptr_t) base.target());
140
  array._rspec = base._rspec;
141
  return array;
142
}
143

144
// exceedingly dangerous constructor
145
Address::Address(address loc, RelocationHolder spec) {
146
  _base  = noreg;
147
  _index = noreg;
148
  _scale = no_scale;
149
  _disp  = (intptr_t) loc;
150
  _rspec = spec;
151
}
152

153
#endif // _LP64
154

155

156

157
// Convert the raw encoding form into the form expected by the constructor for
158
// Address.  An index of 4 (rsp) corresponds to having no index, so convert
159
// that to noreg for the Address constructor.
160
Address Address::make_raw(int base, int index, int scale, int disp, relocInfo::relocType disp_reloc) {
161
  RelocationHolder rspec;
162
  if (disp_reloc != relocInfo::none) {
163
    rspec = Relocation::spec_simple(disp_reloc);
164
  }
165
  bool valid_index = index != rsp->encoding();
166
  if (valid_index) {
167
    Address madr(as_Register(base), as_Register(index), (Address::ScaleFactor)scale, in_ByteSize(disp));
168
    madr._rspec = rspec;
169
    return madr;
170
  } else {
171
    Address madr(as_Register(base), noreg, Address::no_scale, in_ByteSize(disp));
172
    madr._rspec = rspec;
173
    return madr;
174
  }
175
}
176

177
// Implementation of Assembler
178

179
int AbstractAssembler::code_fill_byte() {
180
  return (u_char)'\xF4'; // hlt
181
}
182

183
// make this go away someday
184
void Assembler::emit_data(jint data, relocInfo::relocType rtype, int format) {
185
  if (rtype == relocInfo::none)
186
        emit_int32(data);
187
  else  emit_data(data, Relocation::spec_simple(rtype), format);
188
}
189

190
void Assembler::emit_data(jint data, RelocationHolder const& rspec, int format) {
191
  assert(imm_operand == 0, "default format must be immediate in this file");
192
  assert(inst_mark() != NULL, "must be inside InstructionMark");
193
  if (rspec.type() !=  relocInfo::none) {
194
    #ifdef ASSERT
195
      check_relocation(rspec, format);
196
    #endif
197
    // Do not use AbstractAssembler::relocate, which is not intended for
198
    // embedded words.  Instead, relocate to the enclosing instruction.
199

200
    // hack. call32 is too wide for mask so use disp32
201
    if (format == call32_operand)
202
      code_section()->relocate(inst_mark(), rspec, disp32_operand);
203
    else
204
      code_section()->relocate(inst_mark(), rspec, format);
205
  }
206
  emit_int32(data);
207
}
208

209
static int encode(Register r) {
210
  int enc = r->encoding();
211
  if (enc >= 8) {
212
    enc -= 8;
213
  }
214
  return enc;
215
}
216

217
void Assembler::emit_arith_b(int op1, int op2, Register dst, int imm8) {
218
  assert(dst->has_byte_register(), "must have byte register");
219
  assert(isByte(op1) && isByte(op2), "wrong opcode");
220
  assert(isByte(imm8), "not a byte");
221
  assert((op1 & 0x01) == 0, "should be 8bit operation");
222
  emit_int8(op1);
223
  emit_int8(op2 | encode(dst));
224
  emit_int8(imm8);
225
}
226

227

228
void Assembler::emit_arith(int op1, int op2, Register dst, int32_t imm32) {
229
  assert(isByte(op1) && isByte(op2), "wrong opcode");
230
  assert((op1 & 0x01) == 1, "should be 32bit operation");
231
  assert((op1 & 0x02) == 0, "sign-extension bit should not be set");
232
  if (is8bit(imm32)) {
233
    emit_int8(op1 | 0x02); // set sign bit
234
    emit_int8(op2 | encode(dst));
235
    emit_int8(imm32 & 0xFF);
236
  } else {
237
    emit_int8(op1);
238
    emit_int8(op2 | encode(dst));
239
    emit_int32(imm32);
240
  }
241
}
242

243
// Force generation of a 4 byte immediate value even if it fits into 8bit
244
void Assembler::emit_arith_imm32(int op1, int op2, Register dst, int32_t imm32) {
245
  assert(isByte(op1) && isByte(op2), "wrong opcode");
246
  assert((op1 & 0x01) == 1, "should be 32bit operation");
247
  assert((op1 & 0x02) == 0, "sign-extension bit should not be set");
248
  emit_int8(op1);
249
  emit_int8(op2 | encode(dst));
250
  emit_int32(imm32);
251
}
252

253
// immediate-to-memory forms
254
void Assembler::emit_arith_operand(int op1, Register rm, Address adr, int32_t imm32) {
255
  assert((op1 & 0x01) == 1, "should be 32bit operation");
256
  assert((op1 & 0x02) == 0, "sign-extension bit should not be set");
257
  if (is8bit(imm32)) {
258
    emit_int8(op1 | 0x02); // set sign bit
259
    emit_operand(rm, adr, 1);
260
    emit_int8(imm32 & 0xFF);
261
  } else {
262
    emit_int8(op1);
263
    emit_operand(rm, adr, 4);
264
    emit_int32(imm32);
265
  }
266
}
267

268

269
void Assembler::emit_arith(int op1, int op2, Register dst, Register src) {
270
  assert(isByte(op1) && isByte(op2), "wrong opcode");
271
  emit_int8(op1);
272
  emit_int8(op2 | encode(dst) << 3 | encode(src));
273
}
274

275

276
void Assembler::emit_operand(Register reg, Register base, Register index,
277
                             Address::ScaleFactor scale, int disp,
278
                             RelocationHolder const& rspec,
279
                             int rip_relative_correction) {
280
  relocInfo::relocType rtype = (relocInfo::relocType) rspec.type();
281

282
  // Encode the registers as needed in the fields they are used in
283

284
  int regenc = encode(reg) << 3;
285
  int indexenc = index->is_valid() ? encode(index) << 3 : 0;
286
  int baseenc = base->is_valid() ? encode(base) : 0;
287

288
  if (base->is_valid()) {
289
    if (index->is_valid()) {
290
      assert(scale != Address::no_scale, "inconsistent address");
291
      // [base + index*scale + disp]
292
      if (disp == 0 && rtype == relocInfo::none  &&
293
          base != rbp LP64_ONLY(&& base != r13)) {
294
        // [base + index*scale]
295
        // [00 reg 100][ss index base]
296
        assert(index != rsp, "illegal addressing mode");
297
        emit_int8(0x04 | regenc);
298
        emit_int8(scale << 6 | indexenc | baseenc);
299
      } else if (is8bit(disp) && rtype == relocInfo::none) {
300
        // [base + index*scale + imm8]
301
        // [01 reg 100][ss index base] imm8
302
        assert(index != rsp, "illegal addressing mode");
303
        emit_int8(0x44 | regenc);
304
        emit_int8(scale << 6 | indexenc | baseenc);
305
        emit_int8(disp & 0xFF);
306
      } else {
307
        // [base + index*scale + disp32]
308
        // [10 reg 100][ss index base] disp32
309
        assert(index != rsp, "illegal addressing mode");
310
        emit_int8(0x84 | regenc);
311
        emit_int8(scale << 6 | indexenc | baseenc);
312
        emit_data(disp, rspec, disp32_operand);
313
      }
314
    } else if (base == rsp LP64_ONLY(|| base == r12)) {
315
      // [rsp + disp]
316
      if (disp == 0 && rtype == relocInfo::none) {
317
        // [rsp]
318
        // [00 reg 100][00 100 100]
319
        emit_int8(0x04 | regenc);
320
        emit_int8(0x24);
321
      } else if (is8bit(disp) && rtype == relocInfo::none) {
322
        // [rsp + imm8]
323
        // [01 reg 100][00 100 100] disp8
324
        emit_int8(0x44 | regenc);
325
        emit_int8(0x24);
326
        emit_int8(disp & 0xFF);
327
      } else {
328
        // [rsp + imm32]
329
        // [10 reg 100][00 100 100] disp32
330
        emit_int8(0x84 | regenc);
331
        emit_int8(0x24);
332
        emit_data(disp, rspec, disp32_operand);
333
      }
334
    } else {
335
      // [base + disp]
336
      assert(base != rsp LP64_ONLY(&& base != r12), "illegal addressing mode");
337
      if (disp == 0 && rtype == relocInfo::none &&
338
          base != rbp LP64_ONLY(&& base != r13)) {
339
        // [base]
340
        // [00 reg base]
341
        emit_int8(0x00 | regenc | baseenc);
342
      } else if (is8bit(disp) && rtype == relocInfo::none) {
343
        // [base + disp8]
344
        // [01 reg base] disp8
345
        emit_int8(0x40 | regenc | baseenc);
346
        emit_int8(disp & 0xFF);
347
      } else {
348
        // [base + disp32]
349
        // [10 reg base] disp32
350
        emit_int8(0x80 | regenc | baseenc);
351
        emit_data(disp, rspec, disp32_operand);
352
      }
353
    }
354
  } else {
355
    if (index->is_valid()) {
356
      assert(scale != Address::no_scale, "inconsistent address");
357
      // [index*scale + disp]
358
      // [00 reg 100][ss index 101] disp32
359
      assert(index != rsp, "illegal addressing mode");
360
      emit_int8(0x04 | regenc);
361
      emit_int8(scale << 6 | indexenc | 0x05);
362
      emit_data(disp, rspec, disp32_operand);
363
    } else if (rtype != relocInfo::none ) {
364
      // [disp] (64bit) RIP-RELATIVE (32bit) abs
365
      // [00 000 101] disp32
366

367
      emit_int8(0x05 | regenc);
368
      // Note that the RIP-rel. correction applies to the generated
369
      // disp field, but _not_ to the target address in the rspec.
370

371
      // disp was created by converting the target address minus the pc
372
      // at the start of the instruction. That needs more correction here.
373
      // intptr_t disp = target - next_ip;
374
      assert(inst_mark() != NULL, "must be inside InstructionMark");
375
      address next_ip = pc() + sizeof(int32_t) + rip_relative_correction;
376
      int64_t adjusted = disp;
377
      // Do rip-rel adjustment for 64bit
378
      LP64_ONLY(adjusted -=  (next_ip - inst_mark()));
379
      assert(is_simm32(adjusted),
380
             "must be 32bit offset (RIP relative address)");
381
      emit_data((int32_t) adjusted, rspec, disp32_operand);
382

383
    } else {
384
      // 32bit never did this, did everything as the rip-rel/disp code above
385
      // [disp] ABSOLUTE
386
      // [00 reg 100][00 100 101] disp32
387
      emit_int8(0x04 | regenc);
388
      emit_int8(0x25);
389
      emit_data(disp, rspec, disp32_operand);
390
    }
391
  }
392
}
393

394
void Assembler::emit_operand(XMMRegister reg, Register base, Register index,
395
                             Address::ScaleFactor scale, int disp,
396
                             RelocationHolder const& rspec) {
397
  emit_operand((Register)reg, base, index, scale, disp, rspec);
398
}
399

400
// Secret local extension to Assembler::WhichOperand:
401
#define end_pc_operand (_WhichOperand_limit)
402

403
address Assembler::locate_operand(address inst, WhichOperand which) {
404
  // Decode the given instruction, and return the address of
405
  // an embedded 32-bit operand word.
406

407
  // If "which" is disp32_operand, selects the displacement portion
408
  // of an effective address specifier.
409
  // If "which" is imm64_operand, selects the trailing immediate constant.
410
  // If "which" is call32_operand, selects the displacement of a call or jump.
411
  // Caller is responsible for ensuring that there is such an operand,
412
  // and that it is 32/64 bits wide.
413

414
  // If "which" is end_pc_operand, find the end of the instruction.
415

416
  address ip = inst;
417
  bool is_64bit = false;
418

419
  debug_only(bool has_disp32 = false);
420
  int tail_size = 0; // other random bytes (#32, #16, etc.) at end of insn
421

422
  again_after_prefix:
423
  switch (0xFF & *ip++) {
424

425
  // These convenience macros generate groups of "case" labels for the switch.
426
#define REP4(x) (x)+0: case (x)+1: case (x)+2: case (x)+3
427
#define REP8(x) (x)+0: case (x)+1: case (x)+2: case (x)+3: \
428
             case (x)+4: case (x)+5: case (x)+6: case (x)+7
429
#define REP16(x) REP8((x)+0): \
430
              case REP8((x)+8)
431

432
  case CS_segment:
433
  case SS_segment:
434
  case DS_segment:
435
  case ES_segment:
436
  case FS_segment:
437
  case GS_segment:
438
    // Seems dubious
439
    LP64_ONLY(assert(false, "shouldn't have that prefix"));
440
    assert(ip == inst+1, "only one prefix allowed");
441
    goto again_after_prefix;
442

443
  case 0x67:
444
  case REX:
445
  case REX_B:
446
  case REX_X:
447
  case REX_XB:
448
  case REX_R:
449
  case REX_RB:
450
  case REX_RX:
451
  case REX_RXB:
452
    NOT_LP64(assert(false, "64bit prefixes"));
453
    goto again_after_prefix;
454

455
  case REX_W:
456
  case REX_WB:
457
  case REX_WX:
458
  case REX_WXB:
459
  case REX_WR:
460
  case REX_WRB:
461
  case REX_WRX:
462
  case REX_WRXB:
463
    NOT_LP64(assert(false, "64bit prefixes"));
464
    is_64bit = true;
465
    goto again_after_prefix;
466

467
  case 0xFF: // pushq a; decl a; incl a; call a; jmp a
468
  case 0x88: // movb a, r
469
  case 0x89: // movl a, r
470
  case 0x8A: // movb r, a
471
  case 0x8B: // movl r, a
472
  case 0x8F: // popl a
473
    debug_only(has_disp32 = true);
474
    break;
475

476
  case 0x68: // pushq #32
477
    if (which == end_pc_operand) {
478
      return ip + 4;
479
    }
480
    assert(which == imm_operand && !is_64bit, "pushl has no disp32 or 64bit immediate");
481
    return ip;                  // not produced by emit_operand
482

483
  case 0x66: // movw ... (size prefix)
484
    again_after_size_prefix2:
485
    switch (0xFF & *ip++) {
486
    case REX:
487
    case REX_B:
488
    case REX_X:
489
    case REX_XB:
490
    case REX_R:
491
    case REX_RB:
492
    case REX_RX:
493
    case REX_RXB:
494
    case REX_W:
495
    case REX_WB:
496
    case REX_WX:
497
    case REX_WXB:
498
    case REX_WR:
499
    case REX_WRB:
500
    case REX_WRX:
501
    case REX_WRXB:
502
      NOT_LP64(assert(false, "64bit prefix found"));
503
      goto again_after_size_prefix2;
504
    case 0x8B: // movw r, a
505
    case 0x89: // movw a, r
506
      debug_only(has_disp32 = true);
507
      break;
508
    case 0xC7: // movw a, #16
509
      debug_only(has_disp32 = true);
510
      tail_size = 2;  // the imm16
511
      break;
512
    case 0x0F: // several SSE/SSE2 variants
513
      ip--;    // reparse the 0x0F
514
      goto again_after_prefix;
515
    default:
516
      ShouldNotReachHere();
517
    }
518
    break;
519

520
  case REP8(0xB8): // movl/q r, #32/#64(oop?)
521
    if (which == end_pc_operand)  return ip + (is_64bit ? 8 : 4);
522
    // these asserts are somewhat nonsensical
523
#ifndef _LP64
524
    assert(which == imm_operand || which == disp32_operand,
525
           err_msg("which %d is_64_bit %d ip " INTPTR_FORMAT, which, is_64bit, p2i(ip)));
526
#else
527
    assert((which == call32_operand || which == imm_operand) && is_64bit ||
528
           which == narrow_oop_operand && !is_64bit,
529
           err_msg("which %d is_64_bit %d ip " INTPTR_FORMAT, which, is_64bit, p2i(ip)));
530
#endif // _LP64
531
    return ip;
532

533
  case 0x69: // imul r, a, #32
534
  case 0xC7: // movl a, #32(oop?)
535
    tail_size = 4;
536
    debug_only(has_disp32 = true); // has both kinds of operands!
537
    break;
538

539
  case 0x0F: // movx..., etc.
540
    switch (0xFF & *ip++) {
541
    case 0x3A: // pcmpestri
542
      tail_size = 1;
543
    case 0x38: // ptest, pmovzxbw
544
      ip++; // skip opcode
545
      debug_only(has_disp32 = true); // has both kinds of operands!
546
      break;
547

548
    case 0x70: // pshufd r, r/a, #8
549
      debug_only(has_disp32 = true); // has both kinds of operands!
550
    case 0x73: // psrldq r, #8
551
      tail_size = 1;
552
      break;
553

554
    case 0x12: // movlps
555
    case 0x28: // movaps
556
    case 0x2E: // ucomiss
557
    case 0x2F: // comiss
558
    case 0x54: // andps
559
    case 0x55: // andnps
560
    case 0x56: // orps
561
    case 0x57: // xorps
562
    case 0x6E: // movd
563
    case 0x7E: // movd
564
    case 0xAE: // ldmxcsr, stmxcsr, fxrstor, fxsave, clflush
565
      debug_only(has_disp32 = true);
566
      break;
567

568
    case 0xAD: // shrd r, a, %cl
569
    case 0xAF: // imul r, a
570
    case 0xBE: // movsbl r, a (movsxb)
571
    case 0xBF: // movswl r, a (movsxw)
572
    case 0xB6: // movzbl r, a (movzxb)
573
    case 0xB7: // movzwl r, a (movzxw)
574
    case REP16(0x40): // cmovl cc, r, a
575
    case 0xB0: // cmpxchgb
576
    case 0xB1: // cmpxchg
577
    case 0xC1: // xaddl
578
    case 0xC7: // cmpxchg8
579
    case REP16(0x90): // setcc a
580
      debug_only(has_disp32 = true);
581
      // fall out of the switch to decode the address
582
      break;
583

584
    case 0xC4: // pinsrw r, a, #8
585
      debug_only(has_disp32 = true);
586
    case 0xC5: // pextrw r, r, #8
587
      tail_size = 1;  // the imm8
588
      break;
589

590
    case 0xAC: // shrd r, a, #8
591
      debug_only(has_disp32 = true);
592
      tail_size = 1;  // the imm8
593
      break;
594

595
    case REP16(0x80): // jcc rdisp32
596
      if (which == end_pc_operand)  return ip + 4;
597
      assert(which == call32_operand, "jcc has no disp32 or imm");
598
      return ip;
599
    default:
600
      ShouldNotReachHere();
601
    }
602
    break;
603

604
  case 0x81: // addl a, #32; addl r, #32
605
    // also: orl, adcl, sbbl, andl, subl, xorl, cmpl
606
    // on 32bit in the case of cmpl, the imm might be an oop
607
    tail_size = 4;
608
    debug_only(has_disp32 = true); // has both kinds of operands!
609
    break;
610

611
  case 0x83: // addl a, #8; addl r, #8
612
    // also: orl, adcl, sbbl, andl, subl, xorl, cmpl
613
    debug_only(has_disp32 = true); // has both kinds of operands!
614
    tail_size = 1;
615
    break;
616

617
  case 0x9B:
618
    switch (0xFF & *ip++) {
619
    case 0xD9: // fnstcw a
620
      debug_only(has_disp32 = true);
621
      break;
622
    default:
623
      ShouldNotReachHere();
624
    }
625
    break;
626

627
  case REP4(0x00): // addb a, r; addl a, r; addb r, a; addl r, a
628
  case REP4(0x10): // adc...
629
  case REP4(0x20): // and...
630
  case REP4(0x30): // xor...
631
  case REP4(0x08): // or...
632
  case REP4(0x18): // sbb...
633
  case REP4(0x28): // sub...
634
  case 0xF7: // mull a
635
  case 0x8D: // lea r, a
636
  case 0x87: // xchg r, a
637
  case REP4(0x38): // cmp...
638
  case 0x85: // test r, a
639
    debug_only(has_disp32 = true); // has both kinds of operands!
640
    break;
641

642
  case 0xC1: // sal a, #8; sar a, #8; shl a, #8; shr a, #8
643
  case 0xC6: // movb a, #8
644
  case 0x80: // cmpb a, #8
645
  case 0x6B: // imul r, a, #8
646
    debug_only(has_disp32 = true); // has both kinds of operands!
647
    tail_size = 1; // the imm8
648
    break;
649

650
  case 0xC4: // VEX_3bytes
651
  case 0xC5: // VEX_2bytes
652
    assert((UseAVX > 0), "shouldn't have VEX prefix");
653
    assert(ip == inst+1, "no prefixes allowed");
654
    // C4 and C5 are also used as opcodes for PINSRW and PEXTRW instructions
655
    // but they have prefix 0x0F and processed when 0x0F processed above.
656
    //
657
    // In 32-bit mode the VEX first byte C4 and C5 alias onto LDS and LES
658
    // instructions (these instructions are not supported in 64-bit mode).
659
    // To distinguish them bits [7:6] are set in the VEX second byte since
660
    // ModRM byte can not be of the form 11xxxxxx in 32-bit mode. To set
661
    // those VEX bits REX and vvvv bits are inverted.
662
    //
663
    // Fortunately C2 doesn't generate these instructions so we don't need
664
    // to check for them in product version.
665

666
    // Check second byte
667
    NOT_LP64(assert((0xC0 & *ip) == 0xC0, "shouldn't have LDS and LES instructions"));
668

669
    // First byte
670
    if ((0xFF & *inst) == VEX_3bytes) {
671
      ip++; // third byte
672
      is_64bit = ((VEX_W & *ip) == VEX_W);
673
    }
674
    ip++; // opcode
675
    // To find the end of instruction (which == end_pc_operand).
676
    switch (0xFF & *ip) {
677
    case 0x61: // pcmpestri r, r/a, #8
678
    case 0x70: // pshufd r, r/a, #8
679
    case 0x73: // psrldq r, #8
680
      tail_size = 1;  // the imm8
681
      break;
682
    default:
683
      break;
684
    }
685
    ip++; // skip opcode
686
    debug_only(has_disp32 = true); // has both kinds of operands!
687
    break;
688

689
  case 0xD1: // sal a, 1; sar a, 1; shl a, 1; shr a, 1
690
  case 0xD3: // sal a, %cl; sar a, %cl; shl a, %cl; shr a, %cl
691
  case 0xD9: // fld_s a; fst_s a; fstp_s a; fldcw a
692
  case 0xDD: // fld_d a; fst_d a; fstp_d a
693
  case 0xDB: // fild_s a; fistp_s a; fld_x a; fstp_x a
694
  case 0xDF: // fild_d a; fistp_d a
695
  case 0xD8: // fadd_s a; fsubr_s a; fmul_s a; fdivr_s a; fcomp_s a
696
  case 0xDC: // fadd_d a; fsubr_d a; fmul_d a; fdivr_d a; fcomp_d a
697
  case 0xDE: // faddp_d a; fsubrp_d a; fmulp_d a; fdivrp_d a; fcompp_d a
698
    debug_only(has_disp32 = true);
699
    break;
700

701
  case 0xE8: // call rdisp32
702
  case 0xE9: // jmp  rdisp32
703
    if (which == end_pc_operand)  return ip + 4;
704
    assert(which == call32_operand, "call has no disp32 or imm");
705
    return ip;
706

707
  case 0xF0:                    // Lock
708
    assert(os::is_MP(), "only on MP");
709
    goto again_after_prefix;
710

711
  case 0xF3:                    // For SSE
712
  case 0xF2:                    // For SSE2
713
    switch (0xFF & *ip++) {
714
    case REX:
715
    case REX_B:
716
    case REX_X:
717
    case REX_XB:
718
    case REX_R:
719
    case REX_RB:
720
    case REX_RX:
721
    case REX_RXB:
722
    case REX_W:
723
    case REX_WB:
724
    case REX_WX:
725
    case REX_WXB:
726
    case REX_WR:
727
    case REX_WRB:
728
    case REX_WRX:
729
    case REX_WRXB:
730
      NOT_LP64(assert(false, "found 64bit prefix"));
731
      ip++;
732
    default:
733
      ip++;
734
    }
735
    debug_only(has_disp32 = true); // has both kinds of operands!
736
    break;
737

738
  default:
739
    ShouldNotReachHere();
740

741
#undef REP8
742
#undef REP16
743
  }
744

745
  assert(which != call32_operand, "instruction is not a call, jmp, or jcc");
746
#ifdef _LP64
747
  assert(which != imm_operand, "instruction is not a movq reg, imm64");
748
#else
749
  // assert(which != imm_operand || has_imm32, "instruction has no imm32 field");
750
  assert(which != imm_operand || has_disp32, "instruction has no imm32 field");
751
#endif // LP64
752
  assert(which != disp32_operand || has_disp32, "instruction has no disp32 field");
753

754
  // parse the output of emit_operand
755
  int op2 = 0xFF & *ip++;
756
  int base = op2 & 0x07;
757
  int op3 = -1;
758
  const int b100 = 4;
759
  const int b101 = 5;
760
  if (base == b100 && (op2 >> 6) != 3) {
761
    op3 = 0xFF & *ip++;
762
    base = op3 & 0x07;   // refetch the base
763
  }
764
  // now ip points at the disp (if any)
765

766
  switch (op2 >> 6) {
767
  case 0:
768
    // [00 reg  100][ss index base]
769
    // [00 reg  100][00   100  esp]
770
    // [00 reg base]
771
    // [00 reg  100][ss index  101][disp32]
772
    // [00 reg  101]               [disp32]
773

774
    if (base == b101) {
775
      if (which == disp32_operand)
776
        return ip;              // caller wants the disp32
777
      ip += 4;                  // skip the disp32
778
    }
779
    break;
780

781
  case 1:
782
    // [01 reg  100][ss index base][disp8]
783
    // [01 reg  100][00   100  esp][disp8]
784
    // [01 reg base]               [disp8]
785
    ip += 1;                    // skip the disp8
786
    break;
787

788
  case 2:
789
    // [10 reg  100][ss index base][disp32]
790
    // [10 reg  100][00   100  esp][disp32]
791
    // [10 reg base]               [disp32]
792
    if (which == disp32_operand)
793
      return ip;                // caller wants the disp32
794
    ip += 4;                    // skip the disp32
795
    break;
796

797
  case 3:
798
    // [11 reg base]  (not a memory addressing mode)
799
    break;
800
  }
801

802
  if (which == end_pc_operand) {
803
    return ip + tail_size;
804
  }
805

806
#ifdef _LP64
807
  assert(which == narrow_oop_operand && !is_64bit, "instruction is not a movl adr, imm32");
808
#else
809
  assert(which == imm_operand, "instruction has only an imm field");
810
#endif // LP64
811
  return ip;
812
}
813

814
address Assembler::locate_next_instruction(address inst) {
815
  // Secretly share code with locate_operand:
816
  return locate_operand(inst, end_pc_operand);
817
}
818

819

820
#ifdef ASSERT
821
void Assembler::check_relocation(RelocationHolder const& rspec, int format) {
822
  address inst = inst_mark();
823
  assert(inst != NULL && inst < pc(), "must point to beginning of instruction");
824
  address opnd;
825

826
  Relocation* r = rspec.reloc();
827
  if (r->type() == relocInfo::none) {
828
    return;
829
  } else if (r->is_call() || format == call32_operand) {
830
    // assert(format == imm32_operand, "cannot specify a nonzero format");
831
    opnd = locate_operand(inst, call32_operand);
832
  } else if (r->is_data()) {
833
    assert(format == imm_operand || format == disp32_operand
834
           LP64_ONLY(|| format == narrow_oop_operand), "format ok");
835
    opnd = locate_operand(inst, (WhichOperand)format);
836
  } else {
837
    assert(format == imm_operand, "cannot specify a format");
838
    return;
839
  }
840
  assert(opnd == pc(), "must put operand where relocs can find it");
841
}
842
#endif // ASSERT
843

844
void Assembler::emit_operand32(Register reg, Address adr) {
845
  assert(reg->encoding() < 8, "no extended registers");
846
  assert(!adr.base_needs_rex() && !adr.index_needs_rex(), "no extended registers");
847
  emit_operand(reg, adr._base, adr._index, adr._scale, adr._disp,
848
               adr._rspec);
849
}
850

851
void Assembler::emit_operand(Register reg, Address adr,
852
                             int rip_relative_correction) {
853
  emit_operand(reg, adr._base, adr._index, adr._scale, adr._disp,
854
               adr._rspec,
855
               rip_relative_correction);
856
}
857

858
void Assembler::emit_operand(XMMRegister reg, Address adr) {
859
  emit_operand(reg, adr._base, adr._index, adr._scale, adr._disp,
860
               adr._rspec);
861
}
862

863
// MMX operations
864
void Assembler::emit_operand(MMXRegister reg, Address adr) {
865
  assert(!adr.base_needs_rex() && !adr.index_needs_rex(), "no extended registers");
866
  emit_operand((Register)reg, adr._base, adr._index, adr._scale, adr._disp, adr._rspec);
867
}
868

869
// work around gcc (3.2.1-7a) bug
870
void Assembler::emit_operand(Address adr, MMXRegister reg) {
871
  assert(!adr.base_needs_rex() && !adr.index_needs_rex(), "no extended registers");
872
  emit_operand((Register)reg, adr._base, adr._index, adr._scale, adr._disp, adr._rspec);
873
}
874

875

876
void Assembler::emit_farith(int b1, int b2, int i) {
877
  assert(isByte(b1) && isByte(b2), "wrong opcode");
878
  assert(0 <= i &&  i < 8, "illegal stack offset");
879
  emit_int8(b1);
880
  emit_int8(b2 + i);
881
}
882

883

884
// Now the Assembler instructions (identical for 32/64 bits)
885

886
void Assembler::adcl(Address dst, int32_t imm32) {
887
  InstructionMark im(this);
888
  prefix(dst);
889
  emit_arith_operand(0x81, rdx, dst, imm32);
890
}
891

892
void Assembler::adcl(Address dst, Register src) {
893
  InstructionMark im(this);
894
  prefix(dst, src);
895
  emit_int8(0x11);
896
  emit_operand(src, dst);
897
}
898

899
void Assembler::adcl(Register dst, int32_t imm32) {
900
  prefix(dst);
901
  emit_arith(0x81, 0xD0, dst, imm32);
902
}
903

904
void Assembler::adcl(Register dst, Address src) {
905
  InstructionMark im(this);
906
  prefix(src, dst);
907
  emit_int8(0x13);
908
  emit_operand(dst, src);
909
}
910

911
void Assembler::adcl(Register dst, Register src) {
912
  (void) prefix_and_encode(dst->encoding(), src->encoding());
913
  emit_arith(0x13, 0xC0, dst, src);
914
}
915

916
void Assembler::addl(Address dst, int32_t imm32) {
917
  InstructionMark im(this);
918
  prefix(dst);
919
  emit_arith_operand(0x81, rax, dst, imm32);
920
}
921

922
void Assembler::addl(Address dst, Register src) {
923
  InstructionMark im(this);
924
  prefix(dst, src);
925
  emit_int8(0x01);
926
  emit_operand(src, dst);
927
}
928

929
void Assembler::addl(Register dst, int32_t imm32) {
930
  prefix(dst);
931
  emit_arith(0x81, 0xC0, dst, imm32);
932
}
933

934
void Assembler::addl(Register dst, Address src) {
935
  InstructionMark im(this);
936
  prefix(src, dst);
937
  emit_int8(0x03);
938
  emit_operand(dst, src);
939
}
940

941
void Assembler::addl(Register dst, Register src) {
942
  (void) prefix_and_encode(dst->encoding(), src->encoding());
943
  emit_arith(0x03, 0xC0, dst, src);
944
}
945

946
void Assembler::addr_nop_4() {
947
  assert(UseAddressNop, "no CPU support");
948
  // 4 bytes: NOP DWORD PTR [EAX+0]
949
  emit_int8(0x0F);
950
  emit_int8(0x1F);
951
  emit_int8(0x40); // emit_rm(cbuf, 0x1, EAX_enc, EAX_enc);
952
  emit_int8(0);    // 8-bits offset (1 byte)
953
}
954

955
void Assembler::addr_nop_5() {
956
  assert(UseAddressNop, "no CPU support");
957
  // 5 bytes: NOP DWORD PTR [EAX+EAX*0+0] 8-bits offset
958
  emit_int8(0x0F);
959
  emit_int8(0x1F);
960
  emit_int8(0x44); // emit_rm(cbuf, 0x1, EAX_enc, 0x4);
961
  emit_int8(0x00); // emit_rm(cbuf, 0x0, EAX_enc, EAX_enc);
962
  emit_int8(0);    // 8-bits offset (1 byte)
963
}
964

965
void Assembler::addr_nop_7() {
966
  assert(UseAddressNop, "no CPU support");
967
  // 7 bytes: NOP DWORD PTR [EAX+0] 32-bits offset
968
  emit_int8(0x0F);
969
  emit_int8(0x1F);
970
  emit_int8((unsigned char)0x80);
971
                   // emit_rm(cbuf, 0x2, EAX_enc, EAX_enc);
972
  emit_int32(0);   // 32-bits offset (4 bytes)
973
}
974

975
void Assembler::addr_nop_8() {
976
  assert(UseAddressNop, "no CPU support");
977
  // 8 bytes: NOP DWORD PTR [EAX+EAX*0+0] 32-bits offset
978
  emit_int8(0x0F);
979
  emit_int8(0x1F);
980
  emit_int8((unsigned char)0x84);
981
                   // emit_rm(cbuf, 0x2, EAX_enc, 0x4);
982
  emit_int8(0x00); // emit_rm(cbuf, 0x0, EAX_enc, EAX_enc);
983
  emit_int32(0);   // 32-bits offset (4 bytes)
984
}
985

986
void Assembler::addsd(XMMRegister dst, XMMRegister src) {
987
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
988
  emit_simd_arith(0x58, dst, src, VEX_SIMD_F2);
989
}
990

991
void Assembler::addsd(XMMRegister dst, Address src) {
992
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
993
  emit_simd_arith(0x58, dst, src, VEX_SIMD_F2);
994
}
995

996
void Assembler::addss(XMMRegister dst, XMMRegister src) {
997
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
998
  emit_simd_arith(0x58, dst, src, VEX_SIMD_F3);
999
}
1000

1001
void Assembler::addss(XMMRegister dst, Address src) {
1002
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1003
  emit_simd_arith(0x58, dst, src, VEX_SIMD_F3);
1004
}
1005

1006
void Assembler::aesdec(XMMRegister dst, Address src) {
1007
  assert(VM_Version::supports_aes(), "");
1008
  InstructionMark im(this);
1009
  simd_prefix(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
1010
  emit_int8((unsigned char)0xDE);
1011
  emit_operand(dst, src);
1012
}
1013

1014
void Assembler::aesdec(XMMRegister dst, XMMRegister src) {
1015
  assert(VM_Version::supports_aes(), "");
1016
  int encode = simd_prefix_and_encode(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
1017
  emit_int8((unsigned char)0xDE);
1018
  emit_int8(0xC0 | encode);
1019
}
1020

1021
void Assembler::aesdeclast(XMMRegister dst, Address src) {
1022
  assert(VM_Version::supports_aes(), "");
1023
  InstructionMark im(this);
1024
  simd_prefix(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
1025
  emit_int8((unsigned char)0xDF);
1026
  emit_operand(dst, src);
1027
}
1028

1029
void Assembler::aesdeclast(XMMRegister dst, XMMRegister src) {
1030
  assert(VM_Version::supports_aes(), "");
1031
  int encode = simd_prefix_and_encode(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
1032
  emit_int8((unsigned char)0xDF);
1033
  emit_int8((unsigned char)(0xC0 | encode));
1034
}
1035

1036
void Assembler::aesenc(XMMRegister dst, Address src) {
1037
  assert(VM_Version::supports_aes(), "");
1038
  InstructionMark im(this);
1039
  simd_prefix(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
1040
  emit_int8((unsigned char)0xDC);
1041
  emit_operand(dst, src);
1042
}
1043

1044
void Assembler::aesenc(XMMRegister dst, XMMRegister src) {
1045
  assert(VM_Version::supports_aes(), "");
1046
  int encode = simd_prefix_and_encode(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
1047
  emit_int8((unsigned char)0xDC);
1048
  emit_int8(0xC0 | encode);
1049
}
1050

1051
void Assembler::aesenclast(XMMRegister dst, Address src) {
1052
  assert(VM_Version::supports_aes(), "");
1053
  InstructionMark im(this);
1054
  simd_prefix(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
1055
  emit_int8((unsigned char)0xDD);
1056
  emit_operand(dst, src);
1057
}
1058

1059
void Assembler::aesenclast(XMMRegister dst, XMMRegister src) {
1060
  assert(VM_Version::supports_aes(), "");
1061
  int encode = simd_prefix_and_encode(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
1062
  emit_int8((unsigned char)0xDD);
1063
  emit_int8((unsigned char)(0xC0 | encode));
1064
}
1065

1066

1067
void Assembler::andl(Address dst, int32_t imm32) {
1068
  InstructionMark im(this);
1069
  prefix(dst);
1070
  emit_int8((unsigned char)0x81);
1071
  emit_operand(rsp, dst, 4);
1072
  emit_int32(imm32);
1073
}
1074

1075
void Assembler::andl(Register dst, int32_t imm32) {
1076
  prefix(dst);
1077
  emit_arith(0x81, 0xE0, dst, imm32);
1078
}
1079

1080
void Assembler::andl(Register dst, Address src) {
1081
  InstructionMark im(this);
1082
  prefix(src, dst);
1083
  emit_int8(0x23);
1084
  emit_operand(dst, src);
1085
}
1086

1087
void Assembler::andl(Register dst, Register src) {
1088
  (void) prefix_and_encode(dst->encoding(), src->encoding());
1089
  emit_arith(0x23, 0xC0, dst, src);
1090
}
1091

1092
void Assembler::andnl(Register dst, Register src1, Register src2) {
1093
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
1094
  int encode = vex_prefix_0F38_and_encode(dst, src1, src2);
1095
  emit_int8((unsigned char)0xF2);
1096
  emit_int8((unsigned char)(0xC0 | encode));
1097
}
1098

1099
void Assembler::andnl(Register dst, Register src1, Address src2) {
1100
  InstructionMark im(this);
1101
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
1102
  vex_prefix_0F38(dst, src1, src2);
1103
  emit_int8((unsigned char)0xF2);
1104
  emit_operand(dst, src2);
1105
}
1106

1107
void Assembler::bsfl(Register dst, Register src) {
1108
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
1109
  emit_int8(0x0F);
1110
  emit_int8((unsigned char)0xBC);
1111
  emit_int8((unsigned char)(0xC0 | encode));
1112
}
1113

1114
void Assembler::bsrl(Register dst, Register src) {
1115
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
1116
  emit_int8(0x0F);
1117
  emit_int8((unsigned char)0xBD);
1118
  emit_int8((unsigned char)(0xC0 | encode));
1119
}
1120

1121
void Assembler::bswapl(Register reg) { // bswap
1122
  int encode = prefix_and_encode(reg->encoding());
1123
  emit_int8(0x0F);
1124
  emit_int8((unsigned char)(0xC8 | encode));
1125
}
1126

1127
void Assembler::blsil(Register dst, Register src) {
1128
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
1129
  int encode = vex_prefix_0F38_and_encode(rbx, dst, src);
1130
  emit_int8((unsigned char)0xF3);
1131
  emit_int8((unsigned char)(0xC0 | encode));
1132
}
1133

1134
void Assembler::blsil(Register dst, Address src) {
1135
  InstructionMark im(this);
1136
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
1137
  vex_prefix_0F38(rbx, dst, src);
1138
  emit_int8((unsigned char)0xF3);
1139
  emit_operand(rbx, src);
1140
}
1141

1142
void Assembler::blsmskl(Register dst, Register src) {
1143
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
1144
  int encode = vex_prefix_0F38_and_encode(rdx, dst, src);
1145
  emit_int8((unsigned char)0xF3);
1146
  emit_int8((unsigned char)(0xC0 | encode));
1147
}
1148

1149
void Assembler::blsmskl(Register dst, Address src) {
1150
  InstructionMark im(this);
1151
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
1152
  vex_prefix_0F38(rdx, dst, src);
1153
  emit_int8((unsigned char)0xF3);
1154
  emit_operand(rdx, src);
1155
}
1156

1157
void Assembler::blsrl(Register dst, Register src) {
1158
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
1159
  int encode = vex_prefix_0F38_and_encode(rcx, dst, src);
1160
  emit_int8((unsigned char)0xF3);
1161
  emit_int8((unsigned char)(0xC0 | encode));
1162
}
1163

1164
void Assembler::blsrl(Register dst, Address src) {
1165
  InstructionMark im(this);
1166
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
1167
  vex_prefix_0F38(rcx, dst, src);
1168
  emit_int8((unsigned char)0xF3);
1169
  emit_operand(rcx, src);
1170
}
1171

1172
void Assembler::call(Label& L, relocInfo::relocType rtype) {
1173
  // suspect disp32 is always good
1174
  int operand = LP64_ONLY(disp32_operand) NOT_LP64(imm_operand);
1175

1176
  if (L.is_bound()) {
1177
    const int long_size = 5;
1178
    int offs = (int)( target(L) - pc() );
1179
    assert(offs <= 0, "assembler error");
1180
    InstructionMark im(this);
1181
    // 1110 1000 #32-bit disp
1182
    emit_int8((unsigned char)0xE8);
1183
    emit_data(offs - long_size, rtype, operand);
1184
  } else {
1185
    InstructionMark im(this);
1186
    // 1110 1000 #32-bit disp
1187
    L.add_patch_at(code(), locator());
1188

1189
    emit_int8((unsigned char)0xE8);
1190
    emit_data(int(0), rtype, operand);
1191
  }
1192
}
1193

1194
void Assembler::call(Register dst) {
1195
  int encode = prefix_and_encode(dst->encoding());
1196
  emit_int8((unsigned char)0xFF);
1197
  emit_int8((unsigned char)(0xD0 | encode));
1198
}
1199

1200

1201
void Assembler::call(Address adr) {
1202
  InstructionMark im(this);
1203
  prefix(adr);
1204
  emit_int8((unsigned char)0xFF);
1205
  emit_operand(rdx, adr);
1206
}
1207

1208
void Assembler::call_literal(address entry, RelocationHolder const& rspec) {
1209
  assert(entry != NULL, "call most probably wrong");
1210
  InstructionMark im(this);
1211
  emit_int8((unsigned char)0xE8);
1212
  intptr_t disp = entry - (pc() + sizeof(int32_t));
1213
  assert(is_simm32(disp), "must be 32bit offset (call2)");
1214
  // Technically, should use call32_operand, but this format is
1215
  // implied by the fact that we're emitting a call instruction.
1216

1217
  int operand = LP64_ONLY(disp32_operand) NOT_LP64(call32_operand);
1218
  emit_data((int) disp, rspec, operand);
1219
}
1220

1221
void Assembler::cdql() {
1222
  emit_int8((unsigned char)0x99);
1223
}
1224

1225
void Assembler::cld() {
1226
  emit_int8((unsigned char)0xFC);
1227
}
1228

1229
void Assembler::cmovl(Condition cc, Register dst, Register src) {
1230
  NOT_LP64(guarantee(VM_Version::supports_cmov(), "illegal instruction"));
1231
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
1232
  emit_int8(0x0F);
1233
  emit_int8(0x40 | cc);
1234
  emit_int8((unsigned char)(0xC0 | encode));
1235
}
1236

1237

1238
void Assembler::cmovl(Condition cc, Register dst, Address src) {
1239
  NOT_LP64(guarantee(VM_Version::supports_cmov(), "illegal instruction"));
1240
  prefix(src, dst);
1241
  emit_int8(0x0F);
1242
  emit_int8(0x40 | cc);
1243
  emit_operand(dst, src);
1244
}
1245

1246
void Assembler::cmpb(Address dst, int imm8) {
1247
  InstructionMark im(this);
1248
  prefix(dst);
1249
  emit_int8((unsigned char)0x80);
1250
  emit_operand(rdi, dst, 1);
1251
  emit_int8(imm8);
1252
}
1253

1254
void Assembler::cmpl(Address dst, int32_t imm32) {
1255
  InstructionMark im(this);
1256
  prefix(dst);
1257
  emit_int8((unsigned char)0x81);
1258
  emit_operand(rdi, dst, 4);
1259
  emit_int32(imm32);
1260
}
1261

1262
void Assembler::cmpl(Register dst, int32_t imm32) {
1263
  prefix(dst);
1264
  emit_arith(0x81, 0xF8, dst, imm32);
1265
}
1266

1267
void Assembler::cmpl(Register dst, Register src) {
1268
  (void) prefix_and_encode(dst->encoding(), src->encoding());
1269
  emit_arith(0x3B, 0xC0, dst, src);
1270
}
1271

1272

1273
void Assembler::cmpl(Register dst, Address  src) {
1274
  InstructionMark im(this);
1275
  prefix(src, dst);
1276
  emit_int8((unsigned char)0x3B);
1277
  emit_operand(dst, src);
1278
}
1279

1280
void Assembler::cmpw(Address dst, int imm16) {
1281
  InstructionMark im(this);
1282
  assert(!dst.base_needs_rex() && !dst.index_needs_rex(), "no extended registers");
1283
  emit_int8(0x66);
1284
  emit_int8((unsigned char)0x81);
1285
  emit_operand(rdi, dst, 2);
1286
  emit_int16(imm16);
1287
}
1288

1289
// The 32-bit cmpxchg compares the value at adr with the contents of rax,
1290
// and stores reg into adr if so; otherwise, the value at adr is loaded into rax,.
1291
// The ZF is set if the compared values were equal, and cleared otherwise.
1292
void Assembler::cmpxchgl(Register reg, Address adr) { // cmpxchg
1293
  InstructionMark im(this);
1294
  prefix(adr, reg);
1295
  emit_int8(0x0F);
1296
  emit_int8((unsigned char)0xB1);
1297
  emit_operand(reg, adr);
1298
}
1299

1300
void Assembler::comisd(XMMRegister dst, Address src) {
1301
  // NOTE: dbx seems to decode this as comiss even though the
1302
  // 0x66 is there. Strangly ucomisd comes out correct
1303
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1304
  emit_simd_arith_nonds(0x2F, dst, src, VEX_SIMD_66);
1305
}
1306

1307
void Assembler::comisd(XMMRegister dst, XMMRegister src) {
1308
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1309
  emit_simd_arith_nonds(0x2F, dst, src, VEX_SIMD_66);
1310
}
1311

1312
void Assembler::comiss(XMMRegister dst, Address src) {
1313
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1314
  emit_simd_arith_nonds(0x2F, dst, src, VEX_SIMD_NONE);
1315
}
1316

1317
void Assembler::comiss(XMMRegister dst, XMMRegister src) {
1318
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1319
  emit_simd_arith_nonds(0x2F, dst, src, VEX_SIMD_NONE);
1320
}
1321

1322
void Assembler::cpuid() {
1323
  emit_int8(0x0F);
1324
  emit_int8((unsigned char)0xA2);
1325
}
1326

1327
void Assembler::cvtdq2pd(XMMRegister dst, XMMRegister src) {
1328
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1329
  emit_simd_arith_nonds(0xE6, dst, src, VEX_SIMD_F3);
1330
}
1331

1332
void Assembler::cvtdq2ps(XMMRegister dst, XMMRegister src) {
1333
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1334
  emit_simd_arith_nonds(0x5B, dst, src, VEX_SIMD_NONE);
1335
}
1336

1337
void Assembler::cvtsd2ss(XMMRegister dst, XMMRegister src) {
1338
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1339
  emit_simd_arith(0x5A, dst, src, VEX_SIMD_F2);
1340
}
1341

1342
void Assembler::cvtsd2ss(XMMRegister dst, Address src) {
1343
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1344
  emit_simd_arith(0x5A, dst, src, VEX_SIMD_F2);
1345
}
1346

1347
void Assembler::cvtsi2sdl(XMMRegister dst, Register src) {
1348
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1349
  int encode = simd_prefix_and_encode(dst, dst, src, VEX_SIMD_F2);
1350
  emit_int8(0x2A);
1351
  emit_int8((unsigned char)(0xC0 | encode));
1352
}
1353

1354
void Assembler::cvtsi2sdl(XMMRegister dst, Address src) {
1355
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1356
  emit_simd_arith(0x2A, dst, src, VEX_SIMD_F2);
1357
}
1358

1359
void Assembler::cvtsi2ssl(XMMRegister dst, Register src) {
1360
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1361
  int encode = simd_prefix_and_encode(dst, dst, src, VEX_SIMD_F3);
1362
  emit_int8(0x2A);
1363
  emit_int8((unsigned char)(0xC0 | encode));
1364
}
1365

1366
void Assembler::cvtsi2ssl(XMMRegister dst, Address src) {
1367
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1368
  emit_simd_arith(0x2A, dst, src, VEX_SIMD_F3);
1369
}
1370

1371
void Assembler::cvtss2sd(XMMRegister dst, XMMRegister src) {
1372
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1373
  emit_simd_arith(0x5A, dst, src, VEX_SIMD_F3);
1374
}
1375

1376
void Assembler::cvtss2sd(XMMRegister dst, Address src) {
1377
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1378
  emit_simd_arith(0x5A, dst, src, VEX_SIMD_F3);
1379
}
1380

1381

1382
void Assembler::cvttsd2sil(Register dst, XMMRegister src) {
1383
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1384
  int encode = simd_prefix_and_encode(dst, src, VEX_SIMD_F2);
1385
  emit_int8(0x2C);
1386
  emit_int8((unsigned char)(0xC0 | encode));
1387
}
1388

1389
void Assembler::cvttss2sil(Register dst, XMMRegister src) {
1390
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1391
  int encode = simd_prefix_and_encode(dst, src, VEX_SIMD_F3);
1392
  emit_int8(0x2C);
1393
  emit_int8((unsigned char)(0xC0 | encode));
1394
}
1395

1396
void Assembler::decl(Address dst) {
1397
  // Don't use it directly. Use MacroAssembler::decrement() instead.
1398
  InstructionMark im(this);
1399
  prefix(dst);
1400
  emit_int8((unsigned char)0xFF);
1401
  emit_operand(rcx, dst);
1402
}
1403

1404
void Assembler::divsd(XMMRegister dst, Address src) {
1405
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1406
  emit_simd_arith(0x5E, dst, src, VEX_SIMD_F2);
1407
}
1408

1409
void Assembler::divsd(XMMRegister dst, XMMRegister src) {
1410
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1411
  emit_simd_arith(0x5E, dst, src, VEX_SIMD_F2);
1412
}
1413

1414
void Assembler::divss(XMMRegister dst, Address src) {
1415
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1416
  emit_simd_arith(0x5E, dst, src, VEX_SIMD_F3);
1417
}
1418

1419
void Assembler::divss(XMMRegister dst, XMMRegister src) {
1420
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1421
  emit_simd_arith(0x5E, dst, src, VEX_SIMD_F3);
1422
}
1423

1424
void Assembler::emms() {
1425
  NOT_LP64(assert(VM_Version::supports_mmx(), ""));
1426
  emit_int8(0x0F);
1427
  emit_int8(0x77);
1428
}
1429

1430
void Assembler::hlt() {
1431
  emit_int8((unsigned char)0xF4);
1432
}
1433

1434
void Assembler::idivl(Register src) {
1435
  int encode = prefix_and_encode(src->encoding());
1436
  emit_int8((unsigned char)0xF7);
1437
  emit_int8((unsigned char)(0xF8 | encode));
1438
}
1439

1440
void Assembler::divl(Register src) { // Unsigned
1441
  int encode = prefix_and_encode(src->encoding());
1442
  emit_int8((unsigned char)0xF7);
1443
  emit_int8((unsigned char)(0xF0 | encode));
1444
}
1445

1446
void Assembler::imull(Register dst, Register src) {
1447
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
1448
  emit_int8(0x0F);
1449
  emit_int8((unsigned char)0xAF);
1450
  emit_int8((unsigned char)(0xC0 | encode));
1451
}
1452

1453

1454
void Assembler::imull(Register dst, Register src, int value) {
1455
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
1456
  if (is8bit(value)) {
1457
    emit_int8(0x6B);
1458
    emit_int8((unsigned char)(0xC0 | encode));
1459
    emit_int8(value & 0xFF);
1460
  } else {
1461
    emit_int8(0x69);
1462
    emit_int8((unsigned char)(0xC0 | encode));
1463
    emit_int32(value);
1464
  }
1465
}
1466

1467
void Assembler::imull(Register dst, Address src) {
1468
  InstructionMark im(this);
1469
  prefix(src, dst);
1470
  emit_int8(0x0F);
1471
  emit_int8((unsigned char) 0xAF);
1472
  emit_operand(dst, src);
1473
}
1474

1475

1476
void Assembler::incl(Address dst) {
1477
  // Don't use it directly. Use MacroAssembler::increment() instead.
1478
  InstructionMark im(this);
1479
  prefix(dst);
1480
  emit_int8((unsigned char)0xFF);
1481
  emit_operand(rax, dst);
1482
}
1483

1484
void Assembler::jcc(Condition cc, Label& L, bool maybe_short) {
1485
  InstructionMark im(this);
1486
  assert((0 <= cc) && (cc < 16), "illegal cc");
1487
  if (L.is_bound()) {
1488
    address dst = target(L);
1489
    assert(dst != NULL, "jcc most probably wrong");
1490

1491
    const int short_size = 2;
1492
    const int long_size = 6;
1493
    intptr_t offs = (intptr_t)dst - (intptr_t)pc();
1494
    if (maybe_short && is8bit(offs - short_size)) {
1495
      // 0111 tttn #8-bit disp
1496
      emit_int8(0x70 | cc);
1497
      emit_int8((offs - short_size) & 0xFF);
1498
    } else {
1499
      // 0000 1111 1000 tttn #32-bit disp
1500
      assert(is_simm32(offs - long_size),
1501
             "must be 32bit offset (call4)");
1502
      emit_int8(0x0F);
1503
      emit_int8((unsigned char)(0x80 | cc));
1504
      emit_int32(offs - long_size);
1505
    }
1506
  } else {
1507
    // Note: could eliminate cond. jumps to this jump if condition
1508
    //       is the same however, seems to be rather unlikely case.
1509
    // Note: use jccb() if label to be bound is very close to get
1510
    //       an 8-bit displacement
1511
    L.add_patch_at(code(), locator());
1512
    emit_int8(0x0F);
1513
    emit_int8((unsigned char)(0x80 | cc));
1514
    emit_int32(0);
1515
  }
1516
}
1517

1518
void Assembler::jccb(Condition cc, Label& L) {
1519
  if (L.is_bound()) {
1520
    const int short_size = 2;
1521
    address entry = target(L);
1522
#ifdef ASSERT
1523
    intptr_t dist = (intptr_t)entry - ((intptr_t)pc() + short_size);
1524
    intptr_t delta = short_branch_delta();
1525
    if (delta != 0) {
1526
      dist += (dist < 0 ? (-delta) :delta);
1527
    }
1528
    assert(is8bit(dist), "Dispacement too large for a short jmp");
1529
#endif
1530
    intptr_t offs = (intptr_t)entry - (intptr_t)pc();
1531
    // 0111 tttn #8-bit disp
1532
    emit_int8(0x70 | cc);
1533
    emit_int8((offs - short_size) & 0xFF);
1534
  } else {
1535
    InstructionMark im(this);
1536
    L.add_patch_at(code(), locator());
1537
    emit_int8(0x70 | cc);
1538
    emit_int8(0);
1539
  }
1540
}
1541

1542
void Assembler::jmp(Address adr) {
1543
  InstructionMark im(this);
1544
  prefix(adr);
1545
  emit_int8((unsigned char)0xFF);
1546
  emit_operand(rsp, adr);
1547
}
1548

1549
void Assembler::jmp(Label& L, bool maybe_short) {
1550
  if (L.is_bound()) {
1551
    address entry = target(L);
1552
    assert(entry != NULL, "jmp most probably wrong");
1553
    InstructionMark im(this);
1554
    const int short_size = 2;
1555
    const int long_size = 5;
1556
    intptr_t offs = entry - pc();
1557
    if (maybe_short && is8bit(offs - short_size)) {
1558
      emit_int8((unsigned char)0xEB);
1559
      emit_int8((offs - short_size) & 0xFF);
1560
    } else {
1561
      emit_int8((unsigned char)0xE9);
1562
      emit_int32(offs - long_size);
1563
    }
1564
  } else {
1565
    // By default, forward jumps are always 32-bit displacements, since
1566
    // we can't yet know where the label will be bound.  If you're sure that
1567
    // the forward jump will not run beyond 256 bytes, use jmpb to
1568
    // force an 8-bit displacement.
1569
    InstructionMark im(this);
1570
    L.add_patch_at(code(), locator());
1571
    emit_int8((unsigned char)0xE9);
1572
    emit_int32(0);
1573
  }
1574
}
1575

1576
void Assembler::jmp(Register entry) {
1577
  int encode = prefix_and_encode(entry->encoding());
1578
  emit_int8((unsigned char)0xFF);
1579
  emit_int8((unsigned char)(0xE0 | encode));
1580
}
1581

1582
void Assembler::jmp_literal(address dest, RelocationHolder const& rspec) {
1583
  InstructionMark im(this);
1584
  emit_int8((unsigned char)0xE9);
1585
  assert(dest != NULL, "must have a target");
1586
  intptr_t disp = dest - (pc() + sizeof(int32_t));
1587
  assert(is_simm32(disp), "must be 32bit offset (jmp)");
1588
  emit_data(disp, rspec.reloc(), call32_operand);
1589
}
1590

1591
void Assembler::jmpb(Label& L) {
1592
  if (L.is_bound()) {
1593
    const int short_size = 2;
1594
    address entry = target(L);
1595
    assert(entry != NULL, "jmp most probably wrong");
1596
#ifdef ASSERT
1597
    intptr_t dist = (intptr_t)entry - ((intptr_t)pc() + short_size);
1598
    intptr_t delta = short_branch_delta();
1599
    if (delta != 0) {
1600
      dist += (dist < 0 ? (-delta) :delta);
1601
    }
1602
    assert(is8bit(dist), "Dispacement too large for a short jmp");
1603
#endif
1604
    intptr_t offs = entry - pc();
1605
    emit_int8((unsigned char)0xEB);
1606
    emit_int8((offs - short_size) & 0xFF);
1607
  } else {
1608
    InstructionMark im(this);
1609
    L.add_patch_at(code(), locator());
1610
    emit_int8((unsigned char)0xEB);
1611
    emit_int8(0);
1612
  }
1613
}
1614

1615
void Assembler::ldmxcsr( Address src) {
1616
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1617
  InstructionMark im(this);
1618
  prefix(src);
1619
  emit_int8(0x0F);
1620
  emit_int8((unsigned char)0xAE);
1621
  emit_operand(as_Register(2), src);
1622
}
1623

1624
void Assembler::leal(Register dst, Address src) {
1625
  InstructionMark im(this);
1626
#ifdef _LP64
1627
  emit_int8(0x67); // addr32
1628
  prefix(src, dst);
1629
#endif // LP64
1630
  emit_int8((unsigned char)0x8D);
1631
  emit_operand(dst, src);
1632
}
1633

1634
void Assembler::lfence() {
1635
  emit_int8(0x0F);
1636
  emit_int8((unsigned char)0xAE);
1637
  emit_int8((unsigned char)0xE8);
1638
}
1639

1640
void Assembler::lock() {
1641
  emit_int8((unsigned char)0xF0);
1642
}
1643

1644
void Assembler::lzcntl(Register dst, Register src) {
1645
  assert(VM_Version::supports_lzcnt(), "encoding is treated as BSR");
1646
  emit_int8((unsigned char)0xF3);
1647
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
1648
  emit_int8(0x0F);
1649
  emit_int8((unsigned char)0xBD);
1650
  emit_int8((unsigned char)(0xC0 | encode));
1651
}
1652

1653
// Emit mfence instruction
1654
void Assembler::mfence() {
1655
  NOT_LP64(assert(VM_Version::supports_sse2(), "unsupported");)
1656
  emit_int8(0x0F);
1657
  emit_int8((unsigned char)0xAE);
1658
  emit_int8((unsigned char)0xF0);
1659
}
1660

1661
void Assembler::mov(Register dst, Register src) {
1662
  LP64_ONLY(movq(dst, src)) NOT_LP64(movl(dst, src));
1663
}
1664

1665
void Assembler::movapd(XMMRegister dst, XMMRegister src) {
1666
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1667
  emit_simd_arith_nonds(0x28, dst, src, VEX_SIMD_66);
1668
}
1669

1670
void Assembler::movaps(XMMRegister dst, XMMRegister src) {
1671
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1672
  emit_simd_arith_nonds(0x28, dst, src, VEX_SIMD_NONE);
1673
}
1674

1675
void Assembler::movlhps(XMMRegister dst, XMMRegister src) {
1676
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1677
  int encode = simd_prefix_and_encode(dst, src, src, VEX_SIMD_NONE);
1678
  emit_int8(0x16);
1679
  emit_int8((unsigned char)(0xC0 | encode));
1680
}
1681

1682
void Assembler::movb(Register dst, Address src) {
1683
  NOT_LP64(assert(dst->has_byte_register(), "must have byte register"));
1684
  InstructionMark im(this);
1685
  prefix(src, dst, true);
1686
  emit_int8((unsigned char)0x8A);
1687
  emit_operand(dst, src);
1688
}
1689

1690

1691
void Assembler::movb(Address dst, int imm8) {
1692
  InstructionMark im(this);
1693
   prefix(dst);
1694
  emit_int8((unsigned char)0xC6);
1695
  emit_operand(rax, dst, 1);
1696
  emit_int8(imm8);
1697
}
1698

1699

1700
void Assembler::movb(Address dst, Register src) {
1701
  assert(src->has_byte_register(), "must have byte register");
1702
  InstructionMark im(this);
1703
  prefix(dst, src, true);
1704
  emit_int8((unsigned char)0x88);
1705
  emit_operand(src, dst);
1706
}
1707

1708
void Assembler::movdl(XMMRegister dst, Register src) {
1709
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1710
  int encode = simd_prefix_and_encode(dst, src, VEX_SIMD_66);
1711
  emit_int8(0x6E);
1712
  emit_int8((unsigned char)(0xC0 | encode));
1713
}
1714

1715
void Assembler::movdl(Register dst, XMMRegister src) {
1716
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1717
  // swap src/dst to get correct prefix
1718
  int encode = simd_prefix_and_encode(src, dst, VEX_SIMD_66);
1719
  emit_int8(0x7E);
1720
  emit_int8((unsigned char)(0xC0 | encode));
1721
}
1722

1723
void Assembler::movdl(XMMRegister dst, Address src) {
1724
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1725
  InstructionMark im(this);
1726
  simd_prefix(dst, src, VEX_SIMD_66);
1727
  emit_int8(0x6E);
1728
  emit_operand(dst, src);
1729
}
1730

1731
void Assembler::movdl(Address dst, XMMRegister src) {
1732
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1733
  InstructionMark im(this);
1734
  simd_prefix(dst, src, VEX_SIMD_66);
1735
  emit_int8(0x7E);
1736
  emit_operand(src, dst);
1737
}
1738

1739
void Assembler::movdqa(XMMRegister dst, XMMRegister src) {
1740
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1741
  emit_simd_arith_nonds(0x6F, dst, src, VEX_SIMD_66);
1742
}
1743

1744
void Assembler::movdqa(XMMRegister dst, Address src) {
1745
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1746
  emit_simd_arith_nonds(0x6F, dst, src, VEX_SIMD_66);
1747
}
1748

1749
void Assembler::movdqu(XMMRegister dst, Address src) {
1750
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1751
  emit_simd_arith_nonds(0x6F, dst, src, VEX_SIMD_F3);
1752
}
1753

1754
void Assembler::movdqu(XMMRegister dst, XMMRegister src) {
1755
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1756
  emit_simd_arith_nonds(0x6F, dst, src, VEX_SIMD_F3);
1757
}
1758

1759
void Assembler::movdqu(Address dst, XMMRegister src) {
1760
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1761
  InstructionMark im(this);
1762
  simd_prefix(dst, src, VEX_SIMD_F3);
1763
  emit_int8(0x7F);
1764
  emit_operand(src, dst);
1765
}
1766

1767
// Move Unaligned 256bit Vector
1768
void Assembler::vmovdqu(XMMRegister dst, XMMRegister src) {
1769
  assert(UseAVX > 0, "");
1770
  bool vector256 = true;
1771
  int encode = vex_prefix_and_encode(dst, xnoreg, src, VEX_SIMD_F3, vector256);
1772
  emit_int8(0x6F);
1773
  emit_int8((unsigned char)(0xC0 | encode));
1774
}
1775

1776
void Assembler::vmovdqu(XMMRegister dst, Address src) {
1777
  assert(UseAVX > 0, "");
1778
  InstructionMark im(this);
1779
  bool vector256 = true;
1780
  vex_prefix(dst, xnoreg, src, VEX_SIMD_F3, vector256);
1781
  emit_int8(0x6F);
1782
  emit_operand(dst, src);
1783
}
1784

1785
void Assembler::vmovdqu(Address dst, XMMRegister src) {
1786
  assert(UseAVX > 0, "");
1787
  InstructionMark im(this);
1788
  bool vector256 = true;
1789
  // swap src<->dst for encoding
1790
  assert(src != xnoreg, "sanity");
1791
  vex_prefix(src, xnoreg, dst, VEX_SIMD_F3, vector256);
1792
  emit_int8(0x7F);
1793
  emit_operand(src, dst);
1794
}
1795

1796
// Uses zero extension on 64bit
1797

1798
void Assembler::movl(Register dst, int32_t imm32) {
1799
  int encode = prefix_and_encode(dst->encoding());
1800
  emit_int8((unsigned char)(0xB8 | encode));
1801
  emit_int32(imm32);
1802
}
1803

1804
void Assembler::movl(Register dst, Register src) {
1805
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
1806
  emit_int8((unsigned char)0x8B);
1807
  emit_int8((unsigned char)(0xC0 | encode));
1808
}
1809

1810
void Assembler::movl(Register dst, Address src) {
1811
  InstructionMark im(this);
1812
  prefix(src, dst);
1813
  emit_int8((unsigned char)0x8B);
1814
  emit_operand(dst, src);
1815
}
1816

1817
void Assembler::movl(Address dst, int32_t imm32) {
1818
  InstructionMark im(this);
1819
  prefix(dst);
1820
  emit_int8((unsigned char)0xC7);
1821
  emit_operand(rax, dst, 4);
1822
  emit_int32(imm32);
1823
}
1824

1825
void Assembler::movl(Address dst, Register src) {
1826
  InstructionMark im(this);
1827
  prefix(dst, src);
1828
  emit_int8((unsigned char)0x89);
1829
  emit_operand(src, dst);
1830
}
1831

1832
// New cpus require to use movsd and movss to avoid partial register stall
1833
// when loading from memory. But for old Opteron use movlpd instead of movsd.
1834
// The selection is done in MacroAssembler::movdbl() and movflt().
1835
void Assembler::movlpd(XMMRegister dst, Address src) {
1836
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1837
  emit_simd_arith(0x12, dst, src, VEX_SIMD_66);
1838
}
1839

1840
void Assembler::movq( MMXRegister dst, Address src ) {
1841
  assert( VM_Version::supports_mmx(), "" );
1842
  emit_int8(0x0F);
1843
  emit_int8(0x6F);
1844
  emit_operand(dst, src);
1845
}
1846

1847
void Assembler::movq( Address dst, MMXRegister src ) {
1848
  assert( VM_Version::supports_mmx(), "" );
1849
  emit_int8(0x0F);
1850
  emit_int8(0x7F);
1851
  // workaround gcc (3.2.1-7a) bug
1852
  // In that version of gcc with only an emit_operand(MMX, Address)
1853
  // gcc will tail jump and try and reverse the parameters completely
1854
  // obliterating dst in the process. By having a version available
1855
  // that doesn't need to swap the args at the tail jump the bug is
1856
  // avoided.
1857
  emit_operand(dst, src);
1858
}
1859

1860
void Assembler::movq(XMMRegister dst, Address src) {
1861
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1862
  InstructionMark im(this);
1863
  simd_prefix(dst, src, VEX_SIMD_F3);
1864
  emit_int8(0x7E);
1865
  emit_operand(dst, src);
1866
}
1867

1868
void Assembler::movq(Address dst, XMMRegister src) {
1869
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1870
  InstructionMark im(this);
1871
  simd_prefix(dst, src, VEX_SIMD_66);
1872
  emit_int8((unsigned char)0xD6);
1873
  emit_operand(src, dst);
1874
}
1875

1876
void Assembler::movsbl(Register dst, Address src) { // movsxb
1877
  InstructionMark im(this);
1878
  prefix(src, dst);
1879
  emit_int8(0x0F);
1880
  emit_int8((unsigned char)0xBE);
1881
  emit_operand(dst, src);
1882
}
1883

1884
void Assembler::movsbl(Register dst, Register src) { // movsxb
1885
  NOT_LP64(assert(src->has_byte_register(), "must have byte register"));
1886
  int encode = prefix_and_encode(dst->encoding(), src->encoding(), true);
1887
  emit_int8(0x0F);
1888
  emit_int8((unsigned char)0xBE);
1889
  emit_int8((unsigned char)(0xC0 | encode));
1890
}
1891

1892
void Assembler::movsd(XMMRegister dst, XMMRegister src) {
1893
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1894
  emit_simd_arith(0x10, dst, src, VEX_SIMD_F2);
1895
}
1896

1897
void Assembler::movsd(XMMRegister dst, Address src) {
1898
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1899
  emit_simd_arith_nonds(0x10, dst, src, VEX_SIMD_F2);
1900
}
1901

1902
void Assembler::movsd(Address dst, XMMRegister src) {
1903
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
1904
  InstructionMark im(this);
1905
  simd_prefix(dst, src, VEX_SIMD_F2);
1906
  emit_int8(0x11);
1907
  emit_operand(src, dst);
1908
}
1909

1910
void Assembler::movss(XMMRegister dst, XMMRegister src) {
1911
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1912
  emit_simd_arith(0x10, dst, src, VEX_SIMD_F3);
1913
}
1914

1915
void Assembler::movss(XMMRegister dst, Address src) {
1916
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1917
  emit_simd_arith_nonds(0x10, dst, src, VEX_SIMD_F3);
1918
}
1919

1920
void Assembler::movss(Address dst, XMMRegister src) {
1921
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
1922
  InstructionMark im(this);
1923
  simd_prefix(dst, src, VEX_SIMD_F3);
1924
  emit_int8(0x11);
1925
  emit_operand(src, dst);
1926
}
1927

1928
void Assembler::movswl(Register dst, Address src) { // movsxw
1929
  InstructionMark im(this);
1930
  prefix(src, dst);
1931
  emit_int8(0x0F);
1932
  emit_int8((unsigned char)0xBF);
1933
  emit_operand(dst, src);
1934
}
1935

1936
void Assembler::movswl(Register dst, Register src) { // movsxw
1937
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
1938
  emit_int8(0x0F);
1939
  emit_int8((unsigned char)0xBF);
1940
  emit_int8((unsigned char)(0xC0 | encode));
1941
}
1942

1943
void Assembler::movw(Address dst, int imm16) {
1944
  InstructionMark im(this);
1945

1946
  emit_int8(0x66); // switch to 16-bit mode
1947
  prefix(dst);
1948
  emit_int8((unsigned char)0xC7);
1949
  emit_operand(rax, dst, 2);
1950
  emit_int16(imm16);
1951
}
1952

1953
void Assembler::movw(Register dst, Address src) {
1954
  InstructionMark im(this);
1955
  emit_int8(0x66);
1956
  prefix(src, dst);
1957
  emit_int8((unsigned char)0x8B);
1958
  emit_operand(dst, src);
1959
}
1960

1961
void Assembler::movw(Address dst, Register src) {
1962
  InstructionMark im(this);
1963
  emit_int8(0x66);
1964
  prefix(dst, src);
1965
  emit_int8((unsigned char)0x89);
1966
  emit_operand(src, dst);
1967
}
1968

1969
void Assembler::movzbl(Register dst, Address src) { // movzxb
1970
  InstructionMark im(this);
1971
  prefix(src, dst);
1972
  emit_int8(0x0F);
1973
  emit_int8((unsigned char)0xB6);
1974
  emit_operand(dst, src);
1975
}
1976

1977
void Assembler::movzbl(Register dst, Register src) { // movzxb
1978
  NOT_LP64(assert(src->has_byte_register(), "must have byte register"));
1979
  int encode = prefix_and_encode(dst->encoding(), src->encoding(), true);
1980
  emit_int8(0x0F);
1981
  emit_int8((unsigned char)0xB6);
1982
  emit_int8(0xC0 | encode);
1983
}
1984

1985
void Assembler::movzwl(Register dst, Address src) { // movzxw
1986
  InstructionMark im(this);
1987
  prefix(src, dst);
1988
  emit_int8(0x0F);
1989
  emit_int8((unsigned char)0xB7);
1990
  emit_operand(dst, src);
1991
}
1992

1993
void Assembler::movzwl(Register dst, Register src) { // movzxw
1994
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
1995
  emit_int8(0x0F);
1996
  emit_int8((unsigned char)0xB7);
1997
  emit_int8(0xC0 | encode);
1998
}
1999

2000
void Assembler::mull(Address src) {
2001
  InstructionMark im(this);
2002
  prefix(src);
2003
  emit_int8((unsigned char)0xF7);
2004
  emit_operand(rsp, src);
2005
}
2006

2007
void Assembler::mull(Register src) {
2008
  int encode = prefix_and_encode(src->encoding());
2009
  emit_int8((unsigned char)0xF7);
2010
  emit_int8((unsigned char)(0xE0 | encode));
2011
}
2012

2013
void Assembler::mulsd(XMMRegister dst, Address src) {
2014
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2015
  emit_simd_arith(0x59, dst, src, VEX_SIMD_F2);
2016
}
2017

2018
void Assembler::mulsd(XMMRegister dst, XMMRegister src) {
2019
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2020
  emit_simd_arith(0x59, dst, src, VEX_SIMD_F2);
2021
}
2022

2023
void Assembler::mulss(XMMRegister dst, Address src) {
2024
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
2025
  emit_simd_arith(0x59, dst, src, VEX_SIMD_F3);
2026
}
2027

2028
void Assembler::mulss(XMMRegister dst, XMMRegister src) {
2029
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
2030
  emit_simd_arith(0x59, dst, src, VEX_SIMD_F3);
2031
}
2032

2033
void Assembler::negl(Register dst) {
2034
  int encode = prefix_and_encode(dst->encoding());
2035
  emit_int8((unsigned char)0xF7);
2036
  emit_int8((unsigned char)(0xD8 | encode));
2037
}
2038

2039
void Assembler::nop(int i) {
2040
#ifdef ASSERT
2041
  assert(i > 0, " ");
2042
  // The fancy nops aren't currently recognized by debuggers making it a
2043
  // pain to disassemble code while debugging. If asserts are on clearly
2044
  // speed is not an issue so simply use the single byte traditional nop
2045
  // to do alignment.
2046

2047
  for (; i > 0 ; i--) emit_int8((unsigned char)0x90);
2048
  return;
2049

2050
#endif // ASSERT
2051

2052
  if (UseAddressNop && VM_Version::is_intel()) {
2053
    //
2054
    // Using multi-bytes nops "0x0F 0x1F [address]" for Intel
2055
    //  1: 0x90
2056
    //  2: 0x66 0x90
2057
    //  3: 0x66 0x66 0x90 (don't use "0x0F 0x1F 0x00" - need patching safe padding)
2058
    //  4: 0x0F 0x1F 0x40 0x00
2059
    //  5: 0x0F 0x1F 0x44 0x00 0x00
2060
    //  6: 0x66 0x0F 0x1F 0x44 0x00 0x00
2061
    //  7: 0x0F 0x1F 0x80 0x00 0x00 0x00 0x00
2062
    //  8: 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00
2063
    //  9: 0x66 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00
2064
    // 10: 0x66 0x66 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00
2065
    // 11: 0x66 0x66 0x66 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00
2066

2067
    // The rest coding is Intel specific - don't use consecutive address nops
2068

2069
    // 12: 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00 0x66 0x66 0x66 0x90
2070
    // 13: 0x66 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00 0x66 0x66 0x66 0x90
2071
    // 14: 0x66 0x66 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00 0x66 0x66 0x66 0x90
2072
    // 15: 0x66 0x66 0x66 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00 0x66 0x66 0x66 0x90
2073

2074
    while(i >= 15) {
2075
      // For Intel don't generate consecutive addess nops (mix with regular nops)
2076
      i -= 15;
2077
      emit_int8(0x66);   // size prefix
2078
      emit_int8(0x66);   // size prefix
2079
      emit_int8(0x66);   // size prefix
2080
      addr_nop_8();
2081
      emit_int8(0x66);   // size prefix
2082
      emit_int8(0x66);   // size prefix
2083
      emit_int8(0x66);   // size prefix
2084
      emit_int8((unsigned char)0x90);
2085
                         // nop
2086
    }
2087
    switch (i) {
2088
      case 14:
2089
        emit_int8(0x66); // size prefix
2090
      case 13:
2091
        emit_int8(0x66); // size prefix
2092
      case 12:
2093
        addr_nop_8();
2094
        emit_int8(0x66); // size prefix
2095
        emit_int8(0x66); // size prefix
2096
        emit_int8(0x66); // size prefix
2097
        emit_int8((unsigned char)0x90);
2098
                         // nop
2099
        break;
2100
      case 11:
2101
        emit_int8(0x66); // size prefix
2102
      case 10:
2103
        emit_int8(0x66); // size prefix
2104
      case 9:
2105
        emit_int8(0x66); // size prefix
2106
      case 8:
2107
        addr_nop_8();
2108
        break;
2109
      case 7:
2110
        addr_nop_7();
2111
        break;
2112
      case 6:
2113
        emit_int8(0x66); // size prefix
2114
      case 5:
2115
        addr_nop_5();
2116
        break;
2117
      case 4:
2118
        addr_nop_4();
2119
        break;
2120
      case 3:
2121
        // Don't use "0x0F 0x1F 0x00" - need patching safe padding
2122
        emit_int8(0x66); // size prefix
2123
      case 2:
2124
        emit_int8(0x66); // size prefix
2125
      case 1:
2126
        emit_int8((unsigned char)0x90);
2127
                         // nop
2128
        break;
2129
      default:
2130
        assert(i == 0, " ");
2131
    }
2132
    return;
2133
  }
2134
  if (UseAddressNop && VM_Version::is_amd()) {
2135
    //
2136
    // Using multi-bytes nops "0x0F 0x1F [address]" for AMD.
2137
    //  1: 0x90
2138
    //  2: 0x66 0x90
2139
    //  3: 0x66 0x66 0x90 (don't use "0x0F 0x1F 0x00" - need patching safe padding)
2140
    //  4: 0x0F 0x1F 0x40 0x00
2141
    //  5: 0x0F 0x1F 0x44 0x00 0x00
2142
    //  6: 0x66 0x0F 0x1F 0x44 0x00 0x00
2143
    //  7: 0x0F 0x1F 0x80 0x00 0x00 0x00 0x00
2144
    //  8: 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00
2145
    //  9: 0x66 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00
2146
    // 10: 0x66 0x66 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00
2147
    // 11: 0x66 0x66 0x66 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00
2148

2149
    // The rest coding is AMD specific - use consecutive address nops
2150

2151
    // 12: 0x66 0x0F 0x1F 0x44 0x00 0x00 0x66 0x0F 0x1F 0x44 0x00 0x00
2152
    // 13: 0x0F 0x1F 0x80 0x00 0x00 0x00 0x00 0x66 0x0F 0x1F 0x44 0x00 0x00
2153
    // 14: 0x0F 0x1F 0x80 0x00 0x00 0x00 0x00 0x0F 0x1F 0x80 0x00 0x00 0x00 0x00
2154
    // 15: 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00 0x0F 0x1F 0x80 0x00 0x00 0x00 0x00
2155
    // 16: 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00 0x0F 0x1F 0x84 0x00 0x00 0x00 0x00 0x00
2156
    //     Size prefixes (0x66) are added for larger sizes
2157

2158
    while(i >= 22) {
2159
      i -= 11;
2160
      emit_int8(0x66); // size prefix
2161
      emit_int8(0x66); // size prefix
2162
      emit_int8(0x66); // size prefix
2163
      addr_nop_8();
2164
    }
2165
    // Generate first nop for size between 21-12
2166
    switch (i) {
2167
      case 21:
2168
        i -= 1;
2169
        emit_int8(0x66); // size prefix
2170
      case 20:
2171
      case 19:
2172
        i -= 1;
2173
        emit_int8(0x66); // size prefix
2174
      case 18:
2175
      case 17:
2176
        i -= 1;
2177
        emit_int8(0x66); // size prefix
2178
      case 16:
2179
      case 15:
2180
        i -= 8;
2181
        addr_nop_8();
2182
        break;
2183
      case 14:
2184
      case 13:
2185
        i -= 7;
2186
        addr_nop_7();
2187
        break;
2188
      case 12:
2189
        i -= 6;
2190
        emit_int8(0x66); // size prefix
2191
        addr_nop_5();
2192
        break;
2193
      default:
2194
        assert(i < 12, " ");
2195
    }
2196

2197
    // Generate second nop for size between 11-1
2198
    switch (i) {
2199
      case 11:
2200
        emit_int8(0x66); // size prefix
2201
      case 10:
2202
        emit_int8(0x66); // size prefix
2203
      case 9:
2204
        emit_int8(0x66); // size prefix
2205
      case 8:
2206
        addr_nop_8();
2207
        break;
2208
      case 7:
2209
        addr_nop_7();
2210
        break;
2211
      case 6:
2212
        emit_int8(0x66); // size prefix
2213
      case 5:
2214
        addr_nop_5();
2215
        break;
2216
      case 4:
2217
        addr_nop_4();
2218
        break;
2219
      case 3:
2220
        // Don't use "0x0F 0x1F 0x00" - need patching safe padding
2221
        emit_int8(0x66); // size prefix
2222
      case 2:
2223
        emit_int8(0x66); // size prefix
2224
      case 1:
2225
        emit_int8((unsigned char)0x90);
2226
                         // nop
2227
        break;
2228
      default:
2229
        assert(i == 0, " ");
2230
    }
2231
    return;
2232
  }
2233

2234
  // Using nops with size prefixes "0x66 0x90".
2235
  // From AMD Optimization Guide:
2236
  //  1: 0x90
2237
  //  2: 0x66 0x90
2238
  //  3: 0x66 0x66 0x90
2239
  //  4: 0x66 0x66 0x66 0x90
2240
  //  5: 0x66 0x66 0x90 0x66 0x90
2241
  //  6: 0x66 0x66 0x90 0x66 0x66 0x90
2242
  //  7: 0x66 0x66 0x66 0x90 0x66 0x66 0x90
2243
  //  8: 0x66 0x66 0x66 0x90 0x66 0x66 0x66 0x90
2244
  //  9: 0x66 0x66 0x90 0x66 0x66 0x90 0x66 0x66 0x90
2245
  // 10: 0x66 0x66 0x66 0x90 0x66 0x66 0x90 0x66 0x66 0x90
2246
  //
2247
  while(i > 12) {
2248
    i -= 4;
2249
    emit_int8(0x66); // size prefix
2250
    emit_int8(0x66);
2251
    emit_int8(0x66);
2252
    emit_int8((unsigned char)0x90);
2253
                     // nop
2254
  }
2255
  // 1 - 12 nops
2256
  if(i > 8) {
2257
    if(i > 9) {
2258
      i -= 1;
2259
      emit_int8(0x66);
2260
    }
2261
    i -= 3;
2262
    emit_int8(0x66);
2263
    emit_int8(0x66);
2264
    emit_int8((unsigned char)0x90);
2265
  }
2266
  // 1 - 8 nops
2267
  if(i > 4) {
2268
    if(i > 6) {
2269
      i -= 1;
2270
      emit_int8(0x66);
2271
    }
2272
    i -= 3;
2273
    emit_int8(0x66);
2274
    emit_int8(0x66);
2275
    emit_int8((unsigned char)0x90);
2276
  }
2277
  switch (i) {
2278
    case 4:
2279
      emit_int8(0x66);
2280
    case 3:
2281
      emit_int8(0x66);
2282
    case 2:
2283
      emit_int8(0x66);
2284
    case 1:
2285
      emit_int8((unsigned char)0x90);
2286
      break;
2287
    default:
2288
      assert(i == 0, " ");
2289
  }
2290
}
2291

2292
void Assembler::notl(Register dst) {
2293
  int encode = prefix_and_encode(dst->encoding());
2294
  emit_int8((unsigned char)0xF7);
2295
  emit_int8((unsigned char)(0xD0 | encode));
2296
}
2297

2298
void Assembler::orl(Address dst, int32_t imm32) {
2299
  InstructionMark im(this);
2300
  prefix(dst);
2301
  emit_arith_operand(0x81, rcx, dst, imm32);
2302
}
2303

2304
void Assembler::orl(Register dst, int32_t imm32) {
2305
  prefix(dst);
2306
  emit_arith(0x81, 0xC8, dst, imm32);
2307
}
2308

2309
void Assembler::orl(Register dst, Address src) {
2310
  InstructionMark im(this);
2311
  prefix(src, dst);
2312
  emit_int8(0x0B);
2313
  emit_operand(dst, src);
2314
}
2315

2316
void Assembler::orl(Register dst, Register src) {
2317
  (void) prefix_and_encode(dst->encoding(), src->encoding());
2318
  emit_arith(0x0B, 0xC0, dst, src);
2319
}
2320

2321
void Assembler::orl(Address dst, Register src) {
2322
  InstructionMark im(this);
2323
  prefix(dst, src);
2324
  emit_int8(0x09);
2325
  emit_operand(src, dst);
2326
}
2327

2328
void Assembler::packuswb(XMMRegister dst, Address src) {
2329
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2330
  assert((UseAVX > 0), "SSE mode requires address alignment 16 bytes");
2331
  emit_simd_arith(0x67, dst, src, VEX_SIMD_66);
2332
}
2333

2334
void Assembler::packuswb(XMMRegister dst, XMMRegister src) {
2335
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2336
  emit_simd_arith(0x67, dst, src, VEX_SIMD_66);
2337
}
2338

2339
void Assembler::vpackuswb(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
2340
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
2341
  emit_vex_arith(0x67, dst, nds, src, VEX_SIMD_66, vector256);
2342
}
2343

2344
void Assembler::vpermq(XMMRegister dst, XMMRegister src, int imm8, bool vector256) {
2345
  assert(VM_Version::supports_avx2(), "");
2346
  int encode = simd_prefix_and_encode(dst, xnoreg, src, VEX_SIMD_66, VEX_OPCODE_0F_3A, true, vector256);
2347
  emit_int8(0x00);
2348
  emit_int8(0xC0 | encode);
2349
  emit_int8(imm8);
2350
}
2351

2352
void Assembler::pause() {
2353
  emit_int8((unsigned char)0xF3);
2354
  emit_int8((unsigned char)0x90);
2355
}
2356

2357
void Assembler::pcmpestri(XMMRegister dst, Address src, int imm8) {
2358
  assert(VM_Version::supports_sse4_2(), "");
2359
  InstructionMark im(this);
2360
  simd_prefix(dst, src, VEX_SIMD_66, VEX_OPCODE_0F_3A);
2361
  emit_int8(0x61);
2362
  emit_operand(dst, src);
2363
  emit_int8(imm8);
2364
}
2365

2366
void Assembler::pcmpestri(XMMRegister dst, XMMRegister src, int imm8) {
2367
  assert(VM_Version::supports_sse4_2(), "");
2368
  int encode = simd_prefix_and_encode(dst, xnoreg, src, VEX_SIMD_66, VEX_OPCODE_0F_3A);
2369
  emit_int8(0x61);
2370
  emit_int8((unsigned char)(0xC0 | encode));
2371
  emit_int8(imm8);
2372
}
2373

2374
void Assembler::pextrd(Register dst, XMMRegister src, int imm8) {
2375
  assert(VM_Version::supports_sse4_1(), "");
2376
  int encode = simd_prefix_and_encode(as_XMMRegister(dst->encoding()), xnoreg, src, VEX_SIMD_66, VEX_OPCODE_0F_3A, false);
2377
  emit_int8(0x16);
2378
  emit_int8((unsigned char)(0xC0 | encode));
2379
  emit_int8(imm8);
2380
}
2381

2382
void Assembler::pextrq(Register dst, XMMRegister src, int imm8) {
2383
  assert(VM_Version::supports_sse4_1(), "");
2384
  int encode = simd_prefix_and_encode(as_XMMRegister(dst->encoding()), xnoreg, src, VEX_SIMD_66, VEX_OPCODE_0F_3A, true);
2385
  emit_int8(0x16);
2386
  emit_int8((unsigned char)(0xC0 | encode));
2387
  emit_int8(imm8);
2388
}
2389

2390
void Assembler::pinsrd(XMMRegister dst, Register src, int imm8) {
2391
  assert(VM_Version::supports_sse4_1(), "");
2392
  int encode = simd_prefix_and_encode(dst, dst, as_XMMRegister(src->encoding()), VEX_SIMD_66, VEX_OPCODE_0F_3A, false);
2393
  emit_int8(0x22);
2394
  emit_int8((unsigned char)(0xC0 | encode));
2395
  emit_int8(imm8);
2396
}
2397

2398
void Assembler::pinsrq(XMMRegister dst, Register src, int imm8) {
2399
  assert(VM_Version::supports_sse4_1(), "");
2400
  int encode = simd_prefix_and_encode(dst, dst, as_XMMRegister(src->encoding()), VEX_SIMD_66, VEX_OPCODE_0F_3A, true);
2401
  emit_int8(0x22);
2402
  emit_int8((unsigned char)(0xC0 | encode));
2403
  emit_int8(imm8);
2404
}
2405

2406
void Assembler::pmovzxbw(XMMRegister dst, Address src) {
2407
  assert(VM_Version::supports_sse4_1(), "");
2408
  InstructionMark im(this);
2409
  simd_prefix(dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
2410
  emit_int8(0x30);
2411
  emit_operand(dst, src);
2412
}
2413

2414
void Assembler::pmovzxbw(XMMRegister dst, XMMRegister src) {
2415
  assert(VM_Version::supports_sse4_1(), "");
2416
  int encode = simd_prefix_and_encode(dst, xnoreg, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
2417
  emit_int8(0x30);
2418
  emit_int8((unsigned char)(0xC0 | encode));
2419
}
2420

2421
// generic
2422
void Assembler::pop(Register dst) {
2423
  int encode = prefix_and_encode(dst->encoding());
2424
  emit_int8(0x58 | encode);
2425
}
2426

2427
void Assembler::popcntl(Register dst, Address src) {
2428
  assert(VM_Version::supports_popcnt(), "must support");
2429
  InstructionMark im(this);
2430
  emit_int8((unsigned char)0xF3);
2431
  prefix(src, dst);
2432
  emit_int8(0x0F);
2433
  emit_int8((unsigned char)0xB8);
2434
  emit_operand(dst, src);
2435
}
2436

2437
void Assembler::popcntl(Register dst, Register src) {
2438
  assert(VM_Version::supports_popcnt(), "must support");
2439
  emit_int8((unsigned char)0xF3);
2440
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
2441
  emit_int8(0x0F);
2442
  emit_int8((unsigned char)0xB8);
2443
  emit_int8((unsigned char)(0xC0 | encode));
2444
}
2445

2446
void Assembler::popf() {
2447
  emit_int8((unsigned char)0x9D);
2448
}
2449

2450
#ifndef _LP64 // no 32bit push/pop on amd64
2451
void Assembler::popl(Address dst) {
2452
  // NOTE: this will adjust stack by 8byte on 64bits
2453
  InstructionMark im(this);
2454
  prefix(dst);
2455
  emit_int8((unsigned char)0x8F);
2456
  emit_operand(rax, dst);
2457
}
2458
#endif
2459

2460
void Assembler::prefetch_prefix(Address src) {
2461
  prefix(src);
2462
  emit_int8(0x0F);
2463
}
2464

2465
void Assembler::prefetchnta(Address src) {
2466
  NOT_LP64(assert(VM_Version::supports_sse(), "must support"));
2467
  InstructionMark im(this);
2468
  prefetch_prefix(src);
2469
  emit_int8(0x18);
2470
  emit_operand(rax, src); // 0, src
2471
}
2472

2473
void Assembler::prefetchr(Address src) {
2474
  assert(VM_Version::supports_3dnow_prefetch(), "must support");
2475
  InstructionMark im(this);
2476
  prefetch_prefix(src);
2477
  emit_int8(0x0D);
2478
  emit_operand(rax, src); // 0, src
2479
}
2480

2481
void Assembler::prefetcht0(Address src) {
2482
  NOT_LP64(assert(VM_Version::supports_sse(), "must support"));
2483
  InstructionMark im(this);
2484
  prefetch_prefix(src);
2485
  emit_int8(0x18);
2486
  emit_operand(rcx, src); // 1, src
2487
}
2488

2489
void Assembler::prefetcht1(Address src) {
2490
  NOT_LP64(assert(VM_Version::supports_sse(), "must support"));
2491
  InstructionMark im(this);
2492
  prefetch_prefix(src);
2493
  emit_int8(0x18);
2494
  emit_operand(rdx, src); // 2, src
2495
}
2496

2497
void Assembler::prefetcht2(Address src) {
2498
  NOT_LP64(assert(VM_Version::supports_sse(), "must support"));
2499
  InstructionMark im(this);
2500
  prefetch_prefix(src);
2501
  emit_int8(0x18);
2502
  emit_operand(rbx, src); // 3, src
2503
}
2504

2505
void Assembler::prefetchw(Address src) {
2506
  assert(VM_Version::supports_3dnow_prefetch(), "must support");
2507
  InstructionMark im(this);
2508
  prefetch_prefix(src);
2509
  emit_int8(0x0D);
2510
  emit_operand(rcx, src); // 1, src
2511
}
2512

2513
void Assembler::prefix(Prefix p) {
2514
  emit_int8(p);
2515
}
2516

2517
void Assembler::pshufb(XMMRegister dst, XMMRegister src) {
2518
  assert(VM_Version::supports_ssse3(), "");
2519
  int encode = simd_prefix_and_encode(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
2520
  emit_int8(0x00);
2521
  emit_int8((unsigned char)(0xC0 | encode));
2522
}
2523

2524
void Assembler::pshufb(XMMRegister dst, Address src) {
2525
  assert(VM_Version::supports_ssse3(), "");
2526
  InstructionMark im(this);
2527
  simd_prefix(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
2528
  emit_int8(0x00);
2529
  emit_operand(dst, src);
2530
}
2531

2532
void Assembler::pshufd(XMMRegister dst, XMMRegister src, int mode) {
2533
  assert(isByte(mode), "invalid value");
2534
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2535
  emit_simd_arith_nonds(0x70, dst, src, VEX_SIMD_66);
2536
  emit_int8(mode & 0xFF);
2537

2538
}
2539

2540
void Assembler::pshufd(XMMRegister dst, Address src, int mode) {
2541
  assert(isByte(mode), "invalid value");
2542
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2543
  assert((UseAVX > 0), "SSE mode requires address alignment 16 bytes");
2544
  InstructionMark im(this);
2545
  simd_prefix(dst, src, VEX_SIMD_66);
2546
  emit_int8(0x70);
2547
  emit_operand(dst, src);
2548
  emit_int8(mode & 0xFF);
2549
}
2550

2551
void Assembler::pshuflw(XMMRegister dst, XMMRegister src, int mode) {
2552
  assert(isByte(mode), "invalid value");
2553
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2554
  emit_simd_arith_nonds(0x70, dst, src, VEX_SIMD_F2);
2555
  emit_int8(mode & 0xFF);
2556
}
2557

2558
void Assembler::pshuflw(XMMRegister dst, Address src, int mode) {
2559
  assert(isByte(mode), "invalid value");
2560
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2561
  assert((UseAVX > 0), "SSE mode requires address alignment 16 bytes");
2562
  InstructionMark im(this);
2563
  simd_prefix(dst, src, VEX_SIMD_F2);
2564
  emit_int8(0x70);
2565
  emit_operand(dst, src);
2566
  emit_int8(mode & 0xFF);
2567
}
2568

2569
void Assembler::psrldq(XMMRegister dst, int shift) {
2570
  // Shift 128 bit value in xmm register by number of bytes.
2571
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2572
  int encode = simd_prefix_and_encode(xmm3, dst, dst, VEX_SIMD_66);
2573
  emit_int8(0x73);
2574
  emit_int8((unsigned char)(0xC0 | encode));
2575
  emit_int8(shift);
2576
}
2577

2578
void Assembler::pslldq(XMMRegister dst, int shift) {
2579
  // Shift left 128 bit value in xmm register by number of bytes.
2580
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2581
  int encode = simd_prefix_and_encode(xmm7, dst, dst, VEX_SIMD_66);
2582
  emit_int8(0x73);
2583
  emit_int8((unsigned char)(0xC0 | encode));
2584
  emit_int8(shift);
2585
}
2586

2587
void Assembler::ptest(XMMRegister dst, Address src) {
2588
  assert(VM_Version::supports_sse4_1(), "");
2589
  assert((UseAVX > 0), "SSE mode requires address alignment 16 bytes");
2590
  InstructionMark im(this);
2591
  simd_prefix(dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
2592
  emit_int8(0x17);
2593
  emit_operand(dst, src);
2594
}
2595

2596
void Assembler::ptest(XMMRegister dst, XMMRegister src) {
2597
  assert(VM_Version::supports_sse4_1(), "");
2598
  int encode = simd_prefix_and_encode(dst, xnoreg, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
2599
  emit_int8(0x17);
2600
  emit_int8((unsigned char)(0xC0 | encode));
2601
}
2602

2603
void Assembler::vptest(XMMRegister dst, Address src) {
2604
  assert(VM_Version::supports_avx(), "");
2605
  InstructionMark im(this);
2606
  bool vector256 = true;
2607
  assert(dst != xnoreg, "sanity");
2608
  int dst_enc = dst->encoding();
2609
  // swap src<->dst for encoding
2610
  vex_prefix(src, 0, dst_enc, VEX_SIMD_66, VEX_OPCODE_0F_38, false, vector256);
2611
  emit_int8(0x17);
2612
  emit_operand(dst, src);
2613
}
2614

2615
void Assembler::vptest(XMMRegister dst, XMMRegister src) {
2616
  assert(VM_Version::supports_avx(), "");
2617
  bool vector256 = true;
2618
  int encode = vex_prefix_and_encode(dst, xnoreg, src, VEX_SIMD_66, vector256, VEX_OPCODE_0F_38);
2619
  emit_int8(0x17);
2620
  emit_int8((unsigned char)(0xC0 | encode));
2621
}
2622

2623
void Assembler::punpcklbw(XMMRegister dst, Address src) {
2624
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2625
  assert((UseAVX > 0), "SSE mode requires address alignment 16 bytes");
2626
  emit_simd_arith(0x60, dst, src, VEX_SIMD_66);
2627
}
2628

2629
void Assembler::punpcklbw(XMMRegister dst, XMMRegister src) {
2630
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2631
  emit_simd_arith(0x60, dst, src, VEX_SIMD_66);
2632
}
2633

2634
void Assembler::punpckldq(XMMRegister dst, Address src) {
2635
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2636
  assert((UseAVX > 0), "SSE mode requires address alignment 16 bytes");
2637
  emit_simd_arith(0x62, dst, src, VEX_SIMD_66);
2638
}
2639

2640
void Assembler::punpckldq(XMMRegister dst, XMMRegister src) {
2641
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2642
  emit_simd_arith(0x62, dst, src, VEX_SIMD_66);
2643
}
2644

2645
void Assembler::punpcklqdq(XMMRegister dst, XMMRegister src) {
2646
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2647
  emit_simd_arith(0x6C, dst, src, VEX_SIMD_66);
2648
}
2649

2650
void Assembler::push(int32_t imm32) {
2651
  // in 64bits we push 64bits onto the stack but only
2652
  // take a 32bit immediate
2653
  emit_int8(0x68);
2654
  emit_int32(imm32);
2655
}
2656

2657
void Assembler::push(Register src) {
2658
  int encode = prefix_and_encode(src->encoding());
2659

2660
  emit_int8(0x50 | encode);
2661
}
2662

2663
void Assembler::pushf() {
2664
  emit_int8((unsigned char)0x9C);
2665
}
2666

2667
#ifndef _LP64 // no 32bit push/pop on amd64
2668
void Assembler::pushl(Address src) {
2669
  // Note this will push 64bit on 64bit
2670
  InstructionMark im(this);
2671
  prefix(src);
2672
  emit_int8((unsigned char)0xFF);
2673
  emit_operand(rsi, src);
2674
}
2675
#endif
2676

2677
void Assembler::rcll(Register dst, int imm8) {
2678
  assert(isShiftCount(imm8), "illegal shift count");
2679
  int encode = prefix_and_encode(dst->encoding());
2680
  if (imm8 == 1) {
2681
    emit_int8((unsigned char)0xD1);
2682
    emit_int8((unsigned char)(0xD0 | encode));
2683
  } else {
2684
    emit_int8((unsigned char)0xC1);
2685
    emit_int8((unsigned char)0xD0 | encode);
2686
    emit_int8(imm8);
2687
  }
2688
}
2689

2690
void Assembler::rdtsc() {
2691
  emit_int8((unsigned char)0x0F);
2692
  emit_int8((unsigned char)0x31);
2693
}
2694

2695
// copies data from [esi] to [edi] using rcx pointer sized words
2696
// generic
2697
void Assembler::rep_mov() {
2698
  emit_int8((unsigned char)0xF3);
2699
  // MOVSQ
2700
  LP64_ONLY(prefix(REX_W));
2701
  emit_int8((unsigned char)0xA5);
2702
}
2703

2704
// sets rcx bytes with rax, value at [edi]
2705
void Assembler::rep_stosb() {
2706
  emit_int8((unsigned char)0xF3); // REP
2707
  LP64_ONLY(prefix(REX_W));
2708
  emit_int8((unsigned char)0xAA); // STOSB
2709
}
2710

2711
// sets rcx pointer sized words with rax, value at [edi]
2712
// generic
2713
void Assembler::rep_stos() {
2714
  emit_int8((unsigned char)0xF3); // REP
2715
  LP64_ONLY(prefix(REX_W));       // LP64:STOSQ, LP32:STOSD
2716
  emit_int8((unsigned char)0xAB);
2717
}
2718

2719
// scans rcx pointer sized words at [edi] for occurance of rax,
2720
// generic
2721
void Assembler::repne_scan() { // repne_scan
2722
  emit_int8((unsigned char)0xF2);
2723
  // SCASQ
2724
  LP64_ONLY(prefix(REX_W));
2725
  emit_int8((unsigned char)0xAF);
2726
}
2727

2728
#ifdef _LP64
2729
// scans rcx 4 byte words at [edi] for occurance of rax,
2730
// generic
2731
void Assembler::repne_scanl() { // repne_scan
2732
  emit_int8((unsigned char)0xF2);
2733
  // SCASL
2734
  emit_int8((unsigned char)0xAF);
2735
}
2736
#endif
2737

2738
void Assembler::ret(int imm16) {
2739
  if (imm16 == 0) {
2740
    emit_int8((unsigned char)0xC3);
2741
  } else {
2742
    emit_int8((unsigned char)0xC2);
2743
    emit_int16(imm16);
2744
  }
2745
}
2746

2747
void Assembler::sahf() {
2748
#ifdef _LP64
2749
  // Not supported in 64bit mode
2750
  ShouldNotReachHere();
2751
#endif
2752
  emit_int8((unsigned char)0x9E);
2753
}
2754

2755
void Assembler::sarl(Register dst, int imm8) {
2756
  int encode = prefix_and_encode(dst->encoding());
2757
  assert(isShiftCount(imm8), "illegal shift count");
2758
  if (imm8 == 1) {
2759
    emit_int8((unsigned char)0xD1);
2760
    emit_int8((unsigned char)(0xF8 | encode));
2761
  } else {
2762
    emit_int8((unsigned char)0xC1);
2763
    emit_int8((unsigned char)(0xF8 | encode));
2764
    emit_int8(imm8);
2765
  }
2766
}
2767

2768
void Assembler::sarl(Register dst) {
2769
  int encode = prefix_and_encode(dst->encoding());
2770
  emit_int8((unsigned char)0xD3);
2771
  emit_int8((unsigned char)(0xF8 | encode));
2772
}
2773

2774
void Assembler::sbbl(Address dst, int32_t imm32) {
2775
  InstructionMark im(this);
2776
  prefix(dst);
2777
  emit_arith_operand(0x81, rbx, dst, imm32);
2778
}
2779

2780
void Assembler::sbbl(Register dst, int32_t imm32) {
2781
  prefix(dst);
2782
  emit_arith(0x81, 0xD8, dst, imm32);
2783
}
2784

2785

2786
void Assembler::sbbl(Register dst, Address src) {
2787
  InstructionMark im(this);
2788
  prefix(src, dst);
2789
  emit_int8(0x1B);
2790
  emit_operand(dst, src);
2791
}
2792

2793
void Assembler::sbbl(Register dst, Register src) {
2794
  (void) prefix_and_encode(dst->encoding(), src->encoding());
2795
  emit_arith(0x1B, 0xC0, dst, src);
2796
}
2797

2798
void Assembler::setb(Condition cc, Register dst) {
2799
  assert(0 <= cc && cc < 16, "illegal cc");
2800
  int encode = prefix_and_encode(dst->encoding(), true);
2801
  emit_int8(0x0F);
2802
  emit_int8((unsigned char)0x90 | cc);
2803
  emit_int8((unsigned char)(0xC0 | encode));
2804
}
2805

2806
void Assembler::shll(Register dst, int imm8) {
2807
  assert(isShiftCount(imm8), "illegal shift count");
2808
  int encode = prefix_and_encode(dst->encoding());
2809
  if (imm8 == 1 ) {
2810
    emit_int8((unsigned char)0xD1);
2811
    emit_int8((unsigned char)(0xE0 | encode));
2812
  } else {
2813
    emit_int8((unsigned char)0xC1);
2814
    emit_int8((unsigned char)(0xE0 | encode));
2815
    emit_int8(imm8);
2816
  }
2817
}
2818

2819
void Assembler::shll(Register dst) {
2820
  int encode = prefix_and_encode(dst->encoding());
2821
  emit_int8((unsigned char)0xD3);
2822
  emit_int8((unsigned char)(0xE0 | encode));
2823
}
2824

2825
void Assembler::shrl(Register dst, int imm8) {
2826
  assert(isShiftCount(imm8), "illegal shift count");
2827
  int encode = prefix_and_encode(dst->encoding());
2828
  emit_int8((unsigned char)0xC1);
2829
  emit_int8((unsigned char)(0xE8 | encode));
2830
  emit_int8(imm8);
2831
}
2832

2833
void Assembler::shrl(Register dst) {
2834
  int encode = prefix_and_encode(dst->encoding());
2835
  emit_int8((unsigned char)0xD3);
2836
  emit_int8((unsigned char)(0xE8 | encode));
2837
}
2838

2839
// copies a single word from [esi] to [edi]
2840
void Assembler::smovl() {
2841
  emit_int8((unsigned char)0xA5);
2842
}
2843

2844
void Assembler::sqrtsd(XMMRegister dst, XMMRegister src) {
2845
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2846
  emit_simd_arith(0x51, dst, src, VEX_SIMD_F2);
2847
}
2848

2849
void Assembler::sqrtsd(XMMRegister dst, Address src) {
2850
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2851
  emit_simd_arith(0x51, dst, src, VEX_SIMD_F2);
2852
}
2853

2854
void Assembler::sqrtss(XMMRegister dst, XMMRegister src) {
2855
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
2856
  emit_simd_arith(0x51, dst, src, VEX_SIMD_F3);
2857
}
2858

2859
void Assembler::std() {
2860
  emit_int8((unsigned char)0xFD);
2861
}
2862

2863
void Assembler::sqrtss(XMMRegister dst, Address src) {
2864
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
2865
  emit_simd_arith(0x51, dst, src, VEX_SIMD_F3);
2866
}
2867

2868
void Assembler::stmxcsr( Address dst) {
2869
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
2870
  InstructionMark im(this);
2871
  prefix(dst);
2872
  emit_int8(0x0F);
2873
  emit_int8((unsigned char)0xAE);
2874
  emit_operand(as_Register(3), dst);
2875
}
2876

2877
void Assembler::subl(Address dst, int32_t imm32) {
2878
  InstructionMark im(this);
2879
  prefix(dst);
2880
  emit_arith_operand(0x81, rbp, dst, imm32);
2881
}
2882

2883
void Assembler::subl(Address dst, Register src) {
2884
  InstructionMark im(this);
2885
  prefix(dst, src);
2886
  emit_int8(0x29);
2887
  emit_operand(src, dst);
2888
}
2889

2890
void Assembler::subl(Register dst, int32_t imm32) {
2891
  prefix(dst);
2892
  emit_arith(0x81, 0xE8, dst, imm32);
2893
}
2894

2895
// Force generation of a 4 byte immediate value even if it fits into 8bit
2896
void Assembler::subl_imm32(Register dst, int32_t imm32) {
2897
  prefix(dst);
2898
  emit_arith_imm32(0x81, 0xE8, dst, imm32);
2899
}
2900

2901
void Assembler::subl(Register dst, Address src) {
2902
  InstructionMark im(this);
2903
  prefix(src, dst);
2904
  emit_int8(0x2B);
2905
  emit_operand(dst, src);
2906
}
2907

2908
void Assembler::subl(Register dst, Register src) {
2909
  (void) prefix_and_encode(dst->encoding(), src->encoding());
2910
  emit_arith(0x2B, 0xC0, dst, src);
2911
}
2912

2913
void Assembler::subsd(XMMRegister dst, XMMRegister src) {
2914
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2915
  emit_simd_arith(0x5C, dst, src, VEX_SIMD_F2);
2916
}
2917

2918
void Assembler::subsd(XMMRegister dst, Address src) {
2919
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2920
  emit_simd_arith(0x5C, dst, src, VEX_SIMD_F2);
2921
}
2922

2923
void Assembler::subss(XMMRegister dst, XMMRegister src) {
2924
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
2925
  emit_simd_arith(0x5C, dst, src, VEX_SIMD_F3);
2926
}
2927

2928
void Assembler::subss(XMMRegister dst, Address src) {
2929
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
2930
  emit_simd_arith(0x5C, dst, src, VEX_SIMD_F3);
2931
}
2932

2933
void Assembler::testb(Register dst, int imm8) {
2934
  NOT_LP64(assert(dst->has_byte_register(), "must have byte register"));
2935
  (void) prefix_and_encode(dst->encoding(), true);
2936
  emit_arith_b(0xF6, 0xC0, dst, imm8);
2937
}
2938

2939
void Assembler::testl(Register dst, int32_t imm32) {
2940
  // not using emit_arith because test
2941
  // doesn't support sign-extension of
2942
  // 8bit operands
2943
  int encode = dst->encoding();
2944
  if (encode == 0) {
2945
    emit_int8((unsigned char)0xA9);
2946
  } else {
2947
    encode = prefix_and_encode(encode);
2948
    emit_int8((unsigned char)0xF7);
2949
    emit_int8((unsigned char)(0xC0 | encode));
2950
  }
2951
  emit_int32(imm32);
2952
}
2953

2954
void Assembler::testl(Register dst, Register src) {
2955
  (void) prefix_and_encode(dst->encoding(), src->encoding());
2956
  emit_arith(0x85, 0xC0, dst, src);
2957
}
2958

2959
void Assembler::testl(Register dst, Address  src) {
2960
  InstructionMark im(this);
2961
  prefix(src, dst);
2962
  emit_int8((unsigned char)0x85);
2963
  emit_operand(dst, src);
2964
}
2965

2966
void Assembler::tzcntl(Register dst, Register src) {
2967
  assert(VM_Version::supports_bmi1(), "tzcnt instruction not supported");
2968
  emit_int8((unsigned char)0xF3);
2969
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
2970
  emit_int8(0x0F);
2971
  emit_int8((unsigned char)0xBC);
2972
  emit_int8((unsigned char)0xC0 | encode);
2973
}
2974

2975
void Assembler::tzcntq(Register dst, Register src) {
2976
  assert(VM_Version::supports_bmi1(), "tzcnt instruction not supported");
2977
  emit_int8((unsigned char)0xF3);
2978
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
2979
  emit_int8(0x0F);
2980
  emit_int8((unsigned char)0xBC);
2981
  emit_int8((unsigned char)(0xC0 | encode));
2982
}
2983

2984
void Assembler::ucomisd(XMMRegister dst, Address src) {
2985
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2986
  emit_simd_arith_nonds(0x2E, dst, src, VEX_SIMD_66);
2987
}
2988

2989
void Assembler::ucomisd(XMMRegister dst, XMMRegister src) {
2990
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
2991
  emit_simd_arith_nonds(0x2E, dst, src, VEX_SIMD_66);
2992
}
2993

2994
void Assembler::ucomiss(XMMRegister dst, Address src) {
2995
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
2996
  emit_simd_arith_nonds(0x2E, dst, src, VEX_SIMD_NONE);
2997
}
2998

2999
void Assembler::ucomiss(XMMRegister dst, XMMRegister src) {
3000
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
3001
  emit_simd_arith_nonds(0x2E, dst, src, VEX_SIMD_NONE);
3002
}
3003

3004
void Assembler::xabort(int8_t imm8) {
3005
  emit_int8((unsigned char)0xC6);
3006
  emit_int8((unsigned char)0xF8);
3007
  emit_int8((unsigned char)(imm8 & 0xFF));
3008
}
3009

3010
void Assembler::xaddl(Address dst, Register src) {
3011
  InstructionMark im(this);
3012
  prefix(dst, src);
3013
  emit_int8(0x0F);
3014
  emit_int8((unsigned char)0xC1);
3015
  emit_operand(src, dst);
3016
}
3017

3018
void Assembler::xbegin(Label& abort, relocInfo::relocType rtype) {
3019
  InstructionMark im(this);
3020
  relocate(rtype);
3021
  if (abort.is_bound()) {
3022
    address entry = target(abort);
3023
    assert(entry != NULL, "abort entry NULL");
3024
    intptr_t offset = entry - pc();
3025
    emit_int8((unsigned char)0xC7);
3026
    emit_int8((unsigned char)0xF8);
3027
    emit_int32(offset - 6); // 2 opcode + 4 address
3028
  } else {
3029
    abort.add_patch_at(code(), locator());
3030
    emit_int8((unsigned char)0xC7);
3031
    emit_int8((unsigned char)0xF8);
3032
    emit_int32(0);
3033
  }
3034
}
3035

3036
void Assembler::xchgl(Register dst, Address src) { // xchg
3037
  InstructionMark im(this);
3038
  prefix(src, dst);
3039
  emit_int8((unsigned char)0x87);
3040
  emit_operand(dst, src);
3041
}
3042

3043
void Assembler::xchgl(Register dst, Register src) {
3044
  int encode = prefix_and_encode(dst->encoding(), src->encoding());
3045
  emit_int8((unsigned char)0x87);
3046
  emit_int8((unsigned char)(0xC0 | encode));
3047
}
3048

3049
void Assembler::xend() {
3050
  emit_int8((unsigned char)0x0F);
3051
  emit_int8((unsigned char)0x01);
3052
  emit_int8((unsigned char)0xD5);
3053
}
3054

3055
void Assembler::xgetbv() {
3056
  emit_int8(0x0F);
3057
  emit_int8(0x01);
3058
  emit_int8((unsigned char)0xD0);
3059
}
3060

3061
void Assembler::xorl(Register dst, int32_t imm32) {
3062
  prefix(dst);
3063
  emit_arith(0x81, 0xF0, dst, imm32);
3064
}
3065

3066
void Assembler::xorl(Register dst, Address src) {
3067
  InstructionMark im(this);
3068
  prefix(src, dst);
3069
  emit_int8(0x33);
3070
  emit_operand(dst, src);
3071
}
3072

3073
void Assembler::xorl(Register dst, Register src) {
3074
  (void) prefix_and_encode(dst->encoding(), src->encoding());
3075
  emit_arith(0x33, 0xC0, dst, src);
3076
}
3077

3078

3079
// AVX 3-operands scalar float-point arithmetic instructions
3080

3081
void Assembler::vaddsd(XMMRegister dst, XMMRegister nds, Address src) {
3082
  assert(VM_Version::supports_avx(), "");
3083
  emit_vex_arith(0x58, dst, nds, src, VEX_SIMD_F2, /* vector256 */ false);
3084
}
3085

3086
void Assembler::vaddsd(XMMRegister dst, XMMRegister nds, XMMRegister src) {
3087
  assert(VM_Version::supports_avx(), "");
3088
  emit_vex_arith(0x58, dst, nds, src, VEX_SIMD_F2, /* vector256 */ false);
3089
}
3090

3091
void Assembler::vaddss(XMMRegister dst, XMMRegister nds, Address src) {
3092
  assert(VM_Version::supports_avx(), "");
3093
  emit_vex_arith(0x58, dst, nds, src, VEX_SIMD_F3, /* vector256 */ false);
3094
}
3095

3096
void Assembler::vaddss(XMMRegister dst, XMMRegister nds, XMMRegister src) {
3097
  assert(VM_Version::supports_avx(), "");
3098
  emit_vex_arith(0x58, dst, nds, src, VEX_SIMD_F3, /* vector256 */ false);
3099
}
3100

3101
void Assembler::vdivsd(XMMRegister dst, XMMRegister nds, Address src) {
3102
  assert(VM_Version::supports_avx(), "");
3103
  emit_vex_arith(0x5E, dst, nds, src, VEX_SIMD_F2, /* vector256 */ false);
3104
}
3105

3106
void Assembler::vdivsd(XMMRegister dst, XMMRegister nds, XMMRegister src) {
3107
  assert(VM_Version::supports_avx(), "");
3108
  emit_vex_arith(0x5E, dst, nds, src, VEX_SIMD_F2, /* vector256 */ false);
3109
}
3110

3111
void Assembler::vdivss(XMMRegister dst, XMMRegister nds, Address src) {
3112
  assert(VM_Version::supports_avx(), "");
3113
  emit_vex_arith(0x5E, dst, nds, src, VEX_SIMD_F3, /* vector256 */ false);
3114
}
3115

3116
void Assembler::vdivss(XMMRegister dst, XMMRegister nds, XMMRegister src) {
3117
  assert(VM_Version::supports_avx(), "");
3118
  emit_vex_arith(0x5E, dst, nds, src, VEX_SIMD_F3, /* vector256 */ false);
3119
}
3120

3121
void Assembler::vmulsd(XMMRegister dst, XMMRegister nds, Address src) {
3122
  assert(VM_Version::supports_avx(), "");
3123
  emit_vex_arith(0x59, dst, nds, src, VEX_SIMD_F2, /* vector256 */ false);
3124
}
3125

3126
void Assembler::vmulsd(XMMRegister dst, XMMRegister nds, XMMRegister src) {
3127
  assert(VM_Version::supports_avx(), "");
3128
  emit_vex_arith(0x59, dst, nds, src, VEX_SIMD_F2, /* vector256 */ false);
3129
}
3130

3131
void Assembler::vmulss(XMMRegister dst, XMMRegister nds, Address src) {
3132
  assert(VM_Version::supports_avx(), "");
3133
  emit_vex_arith(0x59, dst, nds, src, VEX_SIMD_F3, /* vector256 */ false);
3134
}
3135

3136
void Assembler::vmulss(XMMRegister dst, XMMRegister nds, XMMRegister src) {
3137
  assert(VM_Version::supports_avx(), "");
3138
  emit_vex_arith(0x59, dst, nds, src, VEX_SIMD_F3, /* vector256 */ false);
3139
}
3140

3141
void Assembler::vsubsd(XMMRegister dst, XMMRegister nds, Address src) {
3142
  assert(VM_Version::supports_avx(), "");
3143
  emit_vex_arith(0x5C, dst, nds, src, VEX_SIMD_F2, /* vector256 */ false);
3144
}
3145

3146
void Assembler::vsubsd(XMMRegister dst, XMMRegister nds, XMMRegister src) {
3147
  assert(VM_Version::supports_avx(), "");
3148
  emit_vex_arith(0x5C, dst, nds, src, VEX_SIMD_F2, /* vector256 */ false);
3149
}
3150

3151
void Assembler::vsubss(XMMRegister dst, XMMRegister nds, Address src) {
3152
  assert(VM_Version::supports_avx(), "");
3153
  emit_vex_arith(0x5C, dst, nds, src, VEX_SIMD_F3, /* vector256 */ false);
3154
}
3155

3156
void Assembler::vsubss(XMMRegister dst, XMMRegister nds, XMMRegister src) {
3157
  assert(VM_Version::supports_avx(), "");
3158
  emit_vex_arith(0x5C, dst, nds, src, VEX_SIMD_F3, /* vector256 */ false);
3159
}
3160

3161
//====================VECTOR ARITHMETIC=====================================
3162

3163
// Float-point vector arithmetic
3164

3165
void Assembler::addpd(XMMRegister dst, XMMRegister src) {
3166
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3167
  emit_simd_arith(0x58, dst, src, VEX_SIMD_66);
3168
}
3169

3170
void Assembler::addps(XMMRegister dst, XMMRegister src) {
3171
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3172
  emit_simd_arith(0x58, dst, src, VEX_SIMD_NONE);
3173
}
3174

3175
void Assembler::vaddpd(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3176
  assert(VM_Version::supports_avx(), "");
3177
  emit_vex_arith(0x58, dst, nds, src, VEX_SIMD_66, vector256);
3178
}
3179

3180
void Assembler::vaddps(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3181
  assert(VM_Version::supports_avx(), "");
3182
  emit_vex_arith(0x58, dst, nds, src, VEX_SIMD_NONE, vector256);
3183
}
3184

3185
void Assembler::vaddpd(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3186
  assert(VM_Version::supports_avx(), "");
3187
  emit_vex_arith(0x58, dst, nds, src, VEX_SIMD_66, vector256);
3188
}
3189

3190
void Assembler::vaddps(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3191
  assert(VM_Version::supports_avx(), "");
3192
  emit_vex_arith(0x58, dst, nds, src, VEX_SIMD_NONE, vector256);
3193
}
3194

3195
void Assembler::subpd(XMMRegister dst, XMMRegister src) {
3196
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3197
  emit_simd_arith(0x5C, dst, src, VEX_SIMD_66);
3198
}
3199

3200
void Assembler::subps(XMMRegister dst, XMMRegister src) {
3201
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3202
  emit_simd_arith(0x5C, dst, src, VEX_SIMD_NONE);
3203
}
3204

3205
void Assembler::vsubpd(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3206
  assert(VM_Version::supports_avx(), "");
3207
  emit_vex_arith(0x5C, dst, nds, src, VEX_SIMD_66, vector256);
3208
}
3209

3210
void Assembler::vsubps(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3211
  assert(VM_Version::supports_avx(), "");
3212
  emit_vex_arith(0x5C, dst, nds, src, VEX_SIMD_NONE, vector256);
3213
}
3214

3215
void Assembler::vsubpd(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3216
  assert(VM_Version::supports_avx(), "");
3217
  emit_vex_arith(0x5C, dst, nds, src, VEX_SIMD_66, vector256);
3218
}
3219

3220
void Assembler::vsubps(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3221
  assert(VM_Version::supports_avx(), "");
3222
  emit_vex_arith(0x5C, dst, nds, src, VEX_SIMD_NONE, vector256);
3223
}
3224

3225
void Assembler::mulpd(XMMRegister dst, XMMRegister src) {
3226
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3227
  emit_simd_arith(0x59, dst, src, VEX_SIMD_66);
3228
}
3229

3230
void Assembler::mulps(XMMRegister dst, XMMRegister src) {
3231
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3232
  emit_simd_arith(0x59, dst, src, VEX_SIMD_NONE);
3233
}
3234

3235
void Assembler::vmulpd(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3236
  assert(VM_Version::supports_avx(), "");
3237
  emit_vex_arith(0x59, dst, nds, src, VEX_SIMD_66, vector256);
3238
}
3239

3240
void Assembler::vmulps(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3241
  assert(VM_Version::supports_avx(), "");
3242
  emit_vex_arith(0x59, dst, nds, src, VEX_SIMD_NONE, vector256);
3243
}
3244

3245
void Assembler::vmulpd(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3246
  assert(VM_Version::supports_avx(), "");
3247
  emit_vex_arith(0x59, dst, nds, src, VEX_SIMD_66, vector256);
3248
}
3249

3250
void Assembler::vmulps(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3251
  assert(VM_Version::supports_avx(), "");
3252
  emit_vex_arith(0x59, dst, nds, src, VEX_SIMD_NONE, vector256);
3253
}
3254

3255
void Assembler::divpd(XMMRegister dst, XMMRegister src) {
3256
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3257
  emit_simd_arith(0x5E, dst, src, VEX_SIMD_66);
3258
}
3259

3260
void Assembler::divps(XMMRegister dst, XMMRegister src) {
3261
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3262
  emit_simd_arith(0x5E, dst, src, VEX_SIMD_NONE);
3263
}
3264

3265
void Assembler::vdivpd(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3266
  assert(VM_Version::supports_avx(), "");
3267
  emit_vex_arith(0x5E, dst, nds, src, VEX_SIMD_66, vector256);
3268
}
3269

3270
void Assembler::vdivps(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3271
  assert(VM_Version::supports_avx(), "");
3272
  emit_vex_arith(0x5E, dst, nds, src, VEX_SIMD_NONE, vector256);
3273
}
3274

3275
void Assembler::vdivpd(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3276
  assert(VM_Version::supports_avx(), "");
3277
  emit_vex_arith(0x5E, dst, nds, src, VEX_SIMD_66, vector256);
3278
}
3279

3280
void Assembler::vdivps(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3281
  assert(VM_Version::supports_avx(), "");
3282
  emit_vex_arith(0x5E, dst, nds, src, VEX_SIMD_NONE, vector256);
3283
}
3284

3285
void Assembler::andpd(XMMRegister dst, XMMRegister src) {
3286
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3287
  emit_simd_arith(0x54, dst, src, VEX_SIMD_66);
3288
}
3289

3290
void Assembler::andps(XMMRegister dst, XMMRegister src) {
3291
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
3292
  emit_simd_arith(0x54, dst, src, VEX_SIMD_NONE);
3293
}
3294

3295
void Assembler::andps(XMMRegister dst, Address src) {
3296
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
3297
  emit_simd_arith(0x54, dst, src, VEX_SIMD_NONE);
3298
}
3299

3300
void Assembler::andpd(XMMRegister dst, Address src) {
3301
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3302
  emit_simd_arith(0x54, dst, src, VEX_SIMD_66);
3303
}
3304

3305
void Assembler::vandpd(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3306
  assert(VM_Version::supports_avx(), "");
3307
  emit_vex_arith(0x54, dst, nds, src, VEX_SIMD_66, vector256);
3308
}
3309

3310
void Assembler::vandps(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3311
  assert(VM_Version::supports_avx(), "");
3312
  emit_vex_arith(0x54, dst, nds, src, VEX_SIMD_NONE, vector256);
3313
}
3314

3315
void Assembler::vandpd(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3316
  assert(VM_Version::supports_avx(), "");
3317
  emit_vex_arith(0x54, dst, nds, src, VEX_SIMD_66, vector256);
3318
}
3319

3320
void Assembler::vandps(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3321
  assert(VM_Version::supports_avx(), "");
3322
  emit_vex_arith(0x54, dst, nds, src, VEX_SIMD_NONE, vector256);
3323
}
3324

3325
void Assembler::xorpd(XMMRegister dst, XMMRegister src) {
3326
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3327
  emit_simd_arith(0x57, dst, src, VEX_SIMD_66);
3328
}
3329

3330
void Assembler::xorps(XMMRegister dst, XMMRegister src) {
3331
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
3332
  emit_simd_arith(0x57, dst, src, VEX_SIMD_NONE);
3333
}
3334

3335
void Assembler::xorpd(XMMRegister dst, Address src) {
3336
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3337
  emit_simd_arith(0x57, dst, src, VEX_SIMD_66);
3338
}
3339

3340
void Assembler::xorps(XMMRegister dst, Address src) {
3341
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
3342
  emit_simd_arith(0x57, dst, src, VEX_SIMD_NONE);
3343
}
3344

3345
void Assembler::vxorpd(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3346
  assert(VM_Version::supports_avx(), "");
3347
  emit_vex_arith(0x57, dst, nds, src, VEX_SIMD_66, vector256);
3348
}
3349

3350
void Assembler::vxorps(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3351
  assert(VM_Version::supports_avx(), "");
3352
  emit_vex_arith(0x57, dst, nds, src, VEX_SIMD_NONE, vector256);
3353
}
3354

3355
void Assembler::vxorpd(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3356
  assert(VM_Version::supports_avx(), "");
3357
  emit_vex_arith(0x57, dst, nds, src, VEX_SIMD_66, vector256);
3358
}
3359

3360
void Assembler::vxorps(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3361
  assert(VM_Version::supports_avx(), "");
3362
  emit_vex_arith(0x57, dst, nds, src, VEX_SIMD_NONE, vector256);
3363
}
3364

3365

3366
// Integer vector arithmetic
3367
void Assembler::paddb(XMMRegister dst, XMMRegister src) {
3368
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3369
  emit_simd_arith(0xFC, dst, src, VEX_SIMD_66);
3370
}
3371

3372
void Assembler::paddw(XMMRegister dst, XMMRegister src) {
3373
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3374
  emit_simd_arith(0xFD, dst, src, VEX_SIMD_66);
3375
}
3376

3377
void Assembler::paddd(XMMRegister dst, XMMRegister src) {
3378
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3379
  emit_simd_arith(0xFE, dst, src, VEX_SIMD_66);
3380
}
3381

3382
void Assembler::paddq(XMMRegister dst, XMMRegister src) {
3383
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3384
  emit_simd_arith(0xD4, dst, src, VEX_SIMD_66);
3385
}
3386

3387
void Assembler::vpaddb(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3388
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3389
  emit_vex_arith(0xFC, dst, nds, src, VEX_SIMD_66, vector256);
3390
}
3391

3392
void Assembler::vpaddw(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3393
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3394
  emit_vex_arith(0xFD, dst, nds, src, VEX_SIMD_66, vector256);
3395
}
3396

3397
void Assembler::vpaddd(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3398
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3399
  emit_vex_arith(0xFE, dst, nds, src, VEX_SIMD_66, vector256);
3400
}
3401

3402
void Assembler::vpaddq(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3403
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3404
  emit_vex_arith(0xD4, dst, nds, src, VEX_SIMD_66, vector256);
3405
}
3406

3407
void Assembler::vpaddb(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3408
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3409
  emit_vex_arith(0xFC, dst, nds, src, VEX_SIMD_66, vector256);
3410
}
3411

3412
void Assembler::vpaddw(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3413
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3414
  emit_vex_arith(0xFD, dst, nds, src, VEX_SIMD_66, vector256);
3415
}
3416

3417
void Assembler::vpaddd(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3418
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3419
  emit_vex_arith(0xFE, dst, nds, src, VEX_SIMD_66, vector256);
3420
}
3421

3422
void Assembler::vpaddq(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3423
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3424
  emit_vex_arith(0xD4, dst, nds, src, VEX_SIMD_66, vector256);
3425
}
3426

3427
void Assembler::psubb(XMMRegister dst, XMMRegister src) {
3428
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3429
  emit_simd_arith(0xF8, dst, src, VEX_SIMD_66);
3430
}
3431

3432
void Assembler::psubw(XMMRegister dst, XMMRegister src) {
3433
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3434
  emit_simd_arith(0xF9, dst, src, VEX_SIMD_66);
3435
}
3436

3437
void Assembler::psubd(XMMRegister dst, XMMRegister src) {
3438
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3439
  emit_simd_arith(0xFA, dst, src, VEX_SIMD_66);
3440
}
3441

3442
void Assembler::psubq(XMMRegister dst, XMMRegister src) {
3443
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3444
  emit_simd_arith(0xFB, dst, src, VEX_SIMD_66);
3445
}
3446

3447
void Assembler::vpsubb(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3448
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3449
  emit_vex_arith(0xF8, dst, nds, src, VEX_SIMD_66, vector256);
3450
}
3451

3452
void Assembler::vpsubw(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3453
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3454
  emit_vex_arith(0xF9, dst, nds, src, VEX_SIMD_66, vector256);
3455
}
3456

3457
void Assembler::vpsubd(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3458
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3459
  emit_vex_arith(0xFA, dst, nds, src, VEX_SIMD_66, vector256);
3460
}
3461

3462
void Assembler::vpsubq(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3463
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3464
  emit_vex_arith(0xFB, dst, nds, src, VEX_SIMD_66, vector256);
3465
}
3466

3467
void Assembler::vpsubb(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3468
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3469
  emit_vex_arith(0xF8, dst, nds, src, VEX_SIMD_66, vector256);
3470
}
3471

3472
void Assembler::vpsubw(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3473
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3474
  emit_vex_arith(0xF9, dst, nds, src, VEX_SIMD_66, vector256);
3475
}
3476

3477
void Assembler::vpsubd(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3478
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3479
  emit_vex_arith(0xFA, dst, nds, src, VEX_SIMD_66, vector256);
3480
}
3481

3482
void Assembler::vpsubq(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3483
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3484
  emit_vex_arith(0xFB, dst, nds, src, VEX_SIMD_66, vector256);
3485
}
3486

3487
void Assembler::pmullw(XMMRegister dst, XMMRegister src) {
3488
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3489
  emit_simd_arith(0xD5, dst, src, VEX_SIMD_66);
3490
}
3491

3492
void Assembler::pmulld(XMMRegister dst, XMMRegister src) {
3493
  assert(VM_Version::supports_sse4_1(), "");
3494
  int encode = simd_prefix_and_encode(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_38);
3495
  emit_int8(0x40);
3496
  emit_int8((unsigned char)(0xC0 | encode));
3497
}
3498

3499
void Assembler::vpmullw(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3500
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3501
  emit_vex_arith(0xD5, dst, nds, src, VEX_SIMD_66, vector256);
3502
}
3503

3504
void Assembler::vpmulld(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3505
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3506
  int encode = vex_prefix_and_encode(dst, nds, src, VEX_SIMD_66, vector256, VEX_OPCODE_0F_38);
3507
  emit_int8(0x40);
3508
  emit_int8((unsigned char)(0xC0 | encode));
3509
}
3510

3511
void Assembler::vpmullw(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3512
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3513
  emit_vex_arith(0xD5, dst, nds, src, VEX_SIMD_66, vector256);
3514
}
3515

3516
void Assembler::vpmulld(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3517
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3518
  InstructionMark im(this);
3519
  int dst_enc = dst->encoding();
3520
  int nds_enc = nds->is_valid() ? nds->encoding() : 0;
3521
  vex_prefix(src, nds_enc, dst_enc, VEX_SIMD_66, VEX_OPCODE_0F_38, false, vector256);
3522
  emit_int8(0x40);
3523
  emit_operand(dst, src);
3524
}
3525

3526
// Shift packed integers left by specified number of bits.
3527
void Assembler::psllw(XMMRegister dst, int shift) {
3528
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3529
  // XMM6 is for /6 encoding: 66 0F 71 /6 ib
3530
  int encode = simd_prefix_and_encode(xmm6, dst, dst, VEX_SIMD_66);
3531
  emit_int8(0x71);
3532
  emit_int8((unsigned char)(0xC0 | encode));
3533
  emit_int8(shift & 0xFF);
3534
}
3535

3536
void Assembler::pslld(XMMRegister dst, int shift) {
3537
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3538
  // XMM6 is for /6 encoding: 66 0F 72 /6 ib
3539
  int encode = simd_prefix_and_encode(xmm6, dst, dst, VEX_SIMD_66);
3540
  emit_int8(0x72);
3541
  emit_int8((unsigned char)(0xC0 | encode));
3542
  emit_int8(shift & 0xFF);
3543
}
3544

3545
void Assembler::psllq(XMMRegister dst, int shift) {
3546
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3547
  // XMM6 is for /6 encoding: 66 0F 73 /6 ib
3548
  int encode = simd_prefix_and_encode(xmm6, dst, dst, VEX_SIMD_66);
3549
  emit_int8(0x73);
3550
  emit_int8((unsigned char)(0xC0 | encode));
3551
  emit_int8(shift & 0xFF);
3552
}
3553

3554
void Assembler::psllw(XMMRegister dst, XMMRegister shift) {
3555
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3556
  emit_simd_arith(0xF1, dst, shift, VEX_SIMD_66);
3557
}
3558

3559
void Assembler::pslld(XMMRegister dst, XMMRegister shift) {
3560
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3561
  emit_simd_arith(0xF2, dst, shift, VEX_SIMD_66);
3562
}
3563

3564
void Assembler::psllq(XMMRegister dst, XMMRegister shift) {
3565
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3566
  emit_simd_arith(0xF3, dst, shift, VEX_SIMD_66);
3567
}
3568

3569
void Assembler::vpsllw(XMMRegister dst, XMMRegister src, int shift, bool vector256) {
3570
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3571
  // XMM6 is for /6 encoding: 66 0F 71 /6 ib
3572
  emit_vex_arith(0x71, xmm6, dst, src, VEX_SIMD_66, vector256);
3573
  emit_int8(shift & 0xFF);
3574
}
3575

3576
void Assembler::vpslld(XMMRegister dst, XMMRegister src, int shift, bool vector256) {
3577
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3578
  // XMM6 is for /6 encoding: 66 0F 72 /6 ib
3579
  emit_vex_arith(0x72, xmm6, dst, src, VEX_SIMD_66, vector256);
3580
  emit_int8(shift & 0xFF);
3581
}
3582

3583
void Assembler::vpsllq(XMMRegister dst, XMMRegister src, int shift, bool vector256) {
3584
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3585
  // XMM6 is for /6 encoding: 66 0F 73 /6 ib
3586
  emit_vex_arith(0x73, xmm6, dst, src, VEX_SIMD_66, vector256);
3587
  emit_int8(shift & 0xFF);
3588
}
3589

3590
void Assembler::vpsllw(XMMRegister dst, XMMRegister src, XMMRegister shift, bool vector256) {
3591
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3592
  emit_vex_arith(0xF1, dst, src, shift, VEX_SIMD_66, vector256);
3593
}
3594

3595
void Assembler::vpslld(XMMRegister dst, XMMRegister src, XMMRegister shift, bool vector256) {
3596
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3597
  emit_vex_arith(0xF2, dst, src, shift, VEX_SIMD_66, vector256);
3598
}
3599

3600
void Assembler::vpsllq(XMMRegister dst, XMMRegister src, XMMRegister shift, bool vector256) {
3601
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3602
  emit_vex_arith(0xF3, dst, src, shift, VEX_SIMD_66, vector256);
3603
}
3604

3605
// Shift packed integers logically right by specified number of bits.
3606
void Assembler::psrlw(XMMRegister dst, int shift) {
3607
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3608
  // XMM2 is for /2 encoding: 66 0F 71 /2 ib
3609
  int encode = simd_prefix_and_encode(xmm2, dst, dst, VEX_SIMD_66);
3610
  emit_int8(0x71);
3611
  emit_int8((unsigned char)(0xC0 | encode));
3612
  emit_int8(shift & 0xFF);
3613
}
3614

3615
void Assembler::psrld(XMMRegister dst, int shift) {
3616
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3617
  // XMM2 is for /2 encoding: 66 0F 72 /2 ib
3618
  int encode = simd_prefix_and_encode(xmm2, dst, dst, VEX_SIMD_66);
3619
  emit_int8(0x72);
3620
  emit_int8((unsigned char)(0xC0 | encode));
3621
  emit_int8(shift & 0xFF);
3622
}
3623

3624
void Assembler::psrlq(XMMRegister dst, int shift) {
3625
  // Do not confuse it with psrldq SSE2 instruction which
3626
  // shifts 128 bit value in xmm register by number of bytes.
3627
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3628
  // XMM2 is for /2 encoding: 66 0F 73 /2 ib
3629
  int encode = simd_prefix_and_encode(xmm2, dst, dst, VEX_SIMD_66);
3630
  emit_int8(0x73);
3631
  emit_int8((unsigned char)(0xC0 | encode));
3632
  emit_int8(shift & 0xFF);
3633
}
3634

3635
void Assembler::psrlw(XMMRegister dst, XMMRegister shift) {
3636
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3637
  emit_simd_arith(0xD1, dst, shift, VEX_SIMD_66);
3638
}
3639

3640
void Assembler::psrld(XMMRegister dst, XMMRegister shift) {
3641
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3642
  emit_simd_arith(0xD2, dst, shift, VEX_SIMD_66);
3643
}
3644

3645
void Assembler::psrlq(XMMRegister dst, XMMRegister shift) {
3646
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3647
  emit_simd_arith(0xD3, dst, shift, VEX_SIMD_66);
3648
}
3649

3650
void Assembler::vpsrlw(XMMRegister dst, XMMRegister src, int shift, bool vector256) {
3651
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3652
  // XMM2 is for /2 encoding: 66 0F 73 /2 ib
3653
  emit_vex_arith(0x71, xmm2, dst, src, VEX_SIMD_66, vector256);
3654
  emit_int8(shift & 0xFF);
3655
}
3656

3657
void Assembler::vpsrld(XMMRegister dst, XMMRegister src, int shift, bool vector256) {
3658
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3659
  // XMM2 is for /2 encoding: 66 0F 73 /2 ib
3660
  emit_vex_arith(0x72, xmm2, dst, src, VEX_SIMD_66, vector256);
3661
  emit_int8(shift & 0xFF);
3662
}
3663

3664
void Assembler::vpsrlq(XMMRegister dst, XMMRegister src, int shift, bool vector256) {
3665
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3666
  // XMM2 is for /2 encoding: 66 0F 73 /2 ib
3667
  emit_vex_arith(0x73, xmm2, dst, src, VEX_SIMD_66, vector256);
3668
  emit_int8(shift & 0xFF);
3669
}
3670

3671
void Assembler::vpsrlw(XMMRegister dst, XMMRegister src, XMMRegister shift, bool vector256) {
3672
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3673
  emit_vex_arith(0xD1, dst, src, shift, VEX_SIMD_66, vector256);
3674
}
3675

3676
void Assembler::vpsrld(XMMRegister dst, XMMRegister src, XMMRegister shift, bool vector256) {
3677
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3678
  emit_vex_arith(0xD2, dst, src, shift, VEX_SIMD_66, vector256);
3679
}
3680

3681
void Assembler::vpsrlq(XMMRegister dst, XMMRegister src, XMMRegister shift, bool vector256) {
3682
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3683
  emit_vex_arith(0xD3, dst, src, shift, VEX_SIMD_66, vector256);
3684
}
3685

3686
// Shift packed integers arithmetically right by specified number of bits.
3687
void Assembler::psraw(XMMRegister dst, int shift) {
3688
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3689
  // XMM4 is for /4 encoding: 66 0F 71 /4 ib
3690
  int encode = simd_prefix_and_encode(xmm4, dst, dst, VEX_SIMD_66);
3691
  emit_int8(0x71);
3692
  emit_int8((unsigned char)(0xC0 | encode));
3693
  emit_int8(shift & 0xFF);
3694
}
3695

3696
void Assembler::psrad(XMMRegister dst, int shift) {
3697
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3698
  // XMM4 is for /4 encoding: 66 0F 72 /4 ib
3699
  int encode = simd_prefix_and_encode(xmm4, dst, dst, VEX_SIMD_66);
3700
  emit_int8(0x72);
3701
  emit_int8((unsigned char)(0xC0 | encode));
3702
  emit_int8(shift & 0xFF);
3703
}
3704

3705
void Assembler::psraw(XMMRegister dst, XMMRegister shift) {
3706
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3707
  emit_simd_arith(0xE1, dst, shift, VEX_SIMD_66);
3708
}
3709

3710
void Assembler::psrad(XMMRegister dst, XMMRegister shift) {
3711
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3712
  emit_simd_arith(0xE2, dst, shift, VEX_SIMD_66);
3713
}
3714

3715
void Assembler::vpsraw(XMMRegister dst, XMMRegister src, int shift, bool vector256) {
3716
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3717
  // XMM4 is for /4 encoding: 66 0F 71 /4 ib
3718
  emit_vex_arith(0x71, xmm4, dst, src, VEX_SIMD_66, vector256);
3719
  emit_int8(shift & 0xFF);
3720
}
3721

3722
void Assembler::vpsrad(XMMRegister dst, XMMRegister src, int shift, bool vector256) {
3723
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3724
  // XMM4 is for /4 encoding: 66 0F 71 /4 ib
3725
  emit_vex_arith(0x72, xmm4, dst, src, VEX_SIMD_66, vector256);
3726
  emit_int8(shift & 0xFF);
3727
}
3728

3729
void Assembler::vpsraw(XMMRegister dst, XMMRegister src, XMMRegister shift, bool vector256) {
3730
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3731
  emit_vex_arith(0xE1, dst, src, shift, VEX_SIMD_66, vector256);
3732
}
3733

3734
void Assembler::vpsrad(XMMRegister dst, XMMRegister src, XMMRegister shift, bool vector256) {
3735
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3736
  emit_vex_arith(0xE2, dst, src, shift, VEX_SIMD_66, vector256);
3737
}
3738

3739

3740
// AND packed integers
3741
void Assembler::pand(XMMRegister dst, XMMRegister src) {
3742
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3743
  emit_simd_arith(0xDB, dst, src, VEX_SIMD_66);
3744
}
3745

3746
void Assembler::vpand(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3747
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3748
  emit_vex_arith(0xDB, dst, nds, src, VEX_SIMD_66, vector256);
3749
}
3750

3751
void Assembler::vpand(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3752
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3753
  emit_vex_arith(0xDB, dst, nds, src, VEX_SIMD_66, vector256);
3754
}
3755

3756
void Assembler::por(XMMRegister dst, XMMRegister src) {
3757
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3758
  emit_simd_arith(0xEB, dst, src, VEX_SIMD_66);
3759
}
3760

3761
void Assembler::vpor(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3762
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3763
  emit_vex_arith(0xEB, dst, nds, src, VEX_SIMD_66, vector256);
3764
}
3765

3766
void Assembler::vpor(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3767
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3768
  emit_vex_arith(0xEB, dst, nds, src, VEX_SIMD_66, vector256);
3769
}
3770

3771
void Assembler::pxor(XMMRegister dst, XMMRegister src) {
3772
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
3773
  emit_simd_arith(0xEF, dst, src, VEX_SIMD_66);
3774
}
3775

3776
void Assembler::vpxor(XMMRegister dst, XMMRegister nds, XMMRegister src, bool vector256) {
3777
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3778
  emit_vex_arith(0xEF, dst, nds, src, VEX_SIMD_66, vector256);
3779
}
3780

3781
void Assembler::vpxor(XMMRegister dst, XMMRegister nds, Address src, bool vector256) {
3782
  assert(VM_Version::supports_avx() && !vector256 || VM_Version::supports_avx2(), "256 bit integer vectors requires AVX2");
3783
  emit_vex_arith(0xEF, dst, nds, src, VEX_SIMD_66, vector256);
3784
}
3785

3786

3787
void Assembler::vinsertf128h(XMMRegister dst, XMMRegister nds, XMMRegister src) {
3788
  assert(VM_Version::supports_avx(), "");
3789
  bool vector256 = true;
3790
  int encode = vex_prefix_and_encode(dst, nds, src, VEX_SIMD_66, vector256, VEX_OPCODE_0F_3A);
3791
  emit_int8(0x18);
3792
  emit_int8((unsigned char)(0xC0 | encode));
3793
  // 0x00 - insert into lower 128 bits
3794
  // 0x01 - insert into upper 128 bits
3795
  emit_int8(0x01);
3796
}
3797

3798
void Assembler::vinsertf128h(XMMRegister dst, Address src) {
3799
  assert(VM_Version::supports_avx(), "");
3800
  InstructionMark im(this);
3801
  bool vector256 = true;
3802
  assert(dst != xnoreg, "sanity");
3803
  int dst_enc = dst->encoding();
3804
  // swap src<->dst for encoding
3805
  vex_prefix(src, dst_enc, dst_enc, VEX_SIMD_66, VEX_OPCODE_0F_3A, false, vector256);
3806
  emit_int8(0x18);
3807
  emit_operand(dst, src);
3808
  // 0x01 - insert into upper 128 bits
3809
  emit_int8(0x01);
3810
}
3811

3812
void Assembler::vextractf128h(Address dst, XMMRegister src) {
3813
  assert(VM_Version::supports_avx(), "");
3814
  InstructionMark im(this);
3815
  bool vector256 = true;
3816
  assert(src != xnoreg, "sanity");
3817
  int src_enc = src->encoding();
3818
  vex_prefix(dst, 0, src_enc, VEX_SIMD_66, VEX_OPCODE_0F_3A, false, vector256);
3819
  emit_int8(0x19);
3820
  emit_operand(src, dst);
3821
  // 0x01 - extract from upper 128 bits
3822
  emit_int8(0x01);
3823
}
3824

3825
void Assembler::vinserti128h(XMMRegister dst, XMMRegister nds, XMMRegister src) {
3826
  assert(VM_Version::supports_avx2(), "");
3827
  bool vector256 = true;
3828
  int encode = vex_prefix_and_encode(dst, nds, src, VEX_SIMD_66, vector256, VEX_OPCODE_0F_3A);
3829
  emit_int8(0x38);
3830
  emit_int8((unsigned char)(0xC0 | encode));
3831
  // 0x00 - insert into lower 128 bits
3832
  // 0x01 - insert into upper 128 bits
3833
  emit_int8(0x01);
3834
}
3835

3836
void Assembler::vinserti128h(XMMRegister dst, Address src) {
3837
  assert(VM_Version::supports_avx2(), "");
3838
  InstructionMark im(this);
3839
  bool vector256 = true;
3840
  assert(dst != xnoreg, "sanity");
3841
  int dst_enc = dst->encoding();
3842
  // swap src<->dst for encoding
3843
  vex_prefix(src, dst_enc, dst_enc, VEX_SIMD_66, VEX_OPCODE_0F_3A, false, vector256);
3844
  emit_int8(0x38);
3845
  emit_operand(dst, src);
3846
  // 0x01 - insert into upper 128 bits
3847
  emit_int8(0x01);
3848
}
3849

3850
void Assembler::vextracti128h(Address dst, XMMRegister src) {
3851
  assert(VM_Version::supports_avx2(), "");
3852
  InstructionMark im(this);
3853
  bool vector256 = true;
3854
  assert(src != xnoreg, "sanity");
3855
  int src_enc = src->encoding();
3856
  vex_prefix(dst, 0, src_enc, VEX_SIMD_66, VEX_OPCODE_0F_3A, false, vector256);
3857
  emit_int8(0x39);
3858
  emit_operand(src, dst);
3859
  // 0x01 - extract from upper 128 bits
3860
  emit_int8(0x01);
3861
}
3862

3863
// duplicate 4-bytes integer data from src into 8 locations in dest
3864
void Assembler::vpbroadcastd(XMMRegister dst, XMMRegister src) {
3865
  assert(VM_Version::supports_avx2(), "");
3866
  bool vector256 = true;
3867
  int encode = vex_prefix_and_encode(dst, xnoreg, src, VEX_SIMD_66, vector256, VEX_OPCODE_0F_38);
3868
  emit_int8(0x58);
3869
  emit_int8((unsigned char)(0xC0 | encode));
3870
}
3871

3872
// Carry-Less Multiplication Quadword
3873
void Assembler::pclmulqdq(XMMRegister dst, XMMRegister src, int mask) {
3874
  assert(VM_Version::supports_clmul(), "");
3875
  int encode = simd_prefix_and_encode(dst, dst, src, VEX_SIMD_66, VEX_OPCODE_0F_3A);
3876
  emit_int8(0x44);
3877
  emit_int8((unsigned char)(0xC0 | encode));
3878
  emit_int8((unsigned char)mask);
3879
}
3880

3881
// Carry-Less Multiplication Quadword
3882
void Assembler::vpclmulqdq(XMMRegister dst, XMMRegister nds, XMMRegister src, int mask) {
3883
  assert(VM_Version::supports_avx() && VM_Version::supports_clmul(), "");
3884
  bool vector256 = false;
3885
  int encode = vex_prefix_and_encode(dst, nds, src, VEX_SIMD_66, vector256, VEX_OPCODE_0F_3A);
3886
  emit_int8(0x44);
3887
  emit_int8((unsigned char)(0xC0 | encode));
3888
  emit_int8((unsigned char)mask);
3889
}
3890

3891
void Assembler::vzeroupper() {
3892
  assert(VM_Version::supports_avx(), "");
3893
  (void)vex_prefix_and_encode(xmm0, xmm0, xmm0, VEX_SIMD_NONE);
3894
  emit_int8(0x77);
3895
}
3896

3897

3898
#ifndef _LP64
3899
// 32bit only pieces of the assembler
3900

3901
void Assembler::cmp_literal32(Register src1, int32_t imm32, RelocationHolder const& rspec) {
3902
  // NO PREFIX AS NEVER 64BIT
3903
  InstructionMark im(this);
3904
  emit_int8((unsigned char)0x81);
3905
  emit_int8((unsigned char)(0xF8 | src1->encoding()));
3906
  emit_data(imm32, rspec, 0);
3907
}
3908

3909
void Assembler::cmp_literal32(Address src1, int32_t imm32, RelocationHolder const& rspec) {
3910
  // NO PREFIX AS NEVER 64BIT (not even 32bit versions of 64bit regs
3911
  InstructionMark im(this);
3912
  emit_int8((unsigned char)0x81);
3913
  emit_operand(rdi, src1);
3914
  emit_data(imm32, rspec, 0);
3915
}
3916

3917
// The 64-bit (32bit platform) cmpxchg compares the value at adr with the contents of rdx:rax,
3918
// and stores rcx:rbx into adr if so; otherwise, the value at adr is loaded
3919
// into rdx:rax.  The ZF is set if the compared values were equal, and cleared otherwise.
3920
void Assembler::cmpxchg8(Address adr) {
3921
  InstructionMark im(this);
3922
  emit_int8(0x0F);
3923
  emit_int8((unsigned char)0xC7);
3924
  emit_operand(rcx, adr);
3925
}
3926

3927
void Assembler::decl(Register dst) {
3928
  // Don't use it directly. Use MacroAssembler::decrementl() instead.
3929
 emit_int8(0x48 | dst->encoding());
3930
}
3931

3932
#endif // _LP64
3933

3934
// 64bit typically doesn't use the x87 but needs to for the trig funcs
3935

3936
void Assembler::fabs() {
3937
  emit_int8((unsigned char)0xD9);
3938
  emit_int8((unsigned char)0xE1);
3939
}
3940

3941
void Assembler::fadd(int i) {
3942
  emit_farith(0xD8, 0xC0, i);
3943
}
3944

3945
void Assembler::fadd_d(Address src) {
3946
  InstructionMark im(this);
3947
  emit_int8((unsigned char)0xDC);
3948
  emit_operand32(rax, src);
3949
}
3950

3951
void Assembler::fadd_s(Address src) {
3952
  InstructionMark im(this);
3953
  emit_int8((unsigned char)0xD8);
3954
  emit_operand32(rax, src);
3955
}
3956

3957
void Assembler::fadda(int i) {
3958
  emit_farith(0xDC, 0xC0, i);
3959
}
3960

3961
void Assembler::faddp(int i) {
3962
  emit_farith(0xDE, 0xC0, i);
3963
}
3964

3965
void Assembler::fchs() {
3966
  emit_int8((unsigned char)0xD9);
3967
  emit_int8((unsigned char)0xE0);
3968
}
3969

3970
void Assembler::fcom(int i) {
3971
  emit_farith(0xD8, 0xD0, i);
3972
}
3973

3974
void Assembler::fcomp(int i) {
3975
  emit_farith(0xD8, 0xD8, i);
3976
}
3977

3978
void Assembler::fcomp_d(Address src) {
3979
  InstructionMark im(this);
3980
  emit_int8((unsigned char)0xDC);
3981
  emit_operand32(rbx, src);
3982
}
3983

3984
void Assembler::fcomp_s(Address src) {
3985
  InstructionMark im(this);
3986
  emit_int8((unsigned char)0xD8);
3987
  emit_operand32(rbx, src);
3988
}
3989

3990
void Assembler::fcompp() {
3991
  emit_int8((unsigned char)0xDE);
3992
  emit_int8((unsigned char)0xD9);
3993
}
3994

3995
void Assembler::fcos() {
3996
  emit_int8((unsigned char)0xD9);
3997
  emit_int8((unsigned char)0xFF);
3998
}
3999

4000
void Assembler::fdecstp() {
4001
  emit_int8((unsigned char)0xD9);
4002
  emit_int8((unsigned char)0xF6);
4003
}
4004

4005
void Assembler::fdiv(int i) {
4006
  emit_farith(0xD8, 0xF0, i);
4007
}
4008

4009
void Assembler::fdiv_d(Address src) {
4010
  InstructionMark im(this);
4011
  emit_int8((unsigned char)0xDC);
4012
  emit_operand32(rsi, src);
4013
}
4014

4015
void Assembler::fdiv_s(Address src) {
4016
  InstructionMark im(this);
4017
  emit_int8((unsigned char)0xD8);
4018
  emit_operand32(rsi, src);
4019
}
4020

4021
void Assembler::fdiva(int i) {
4022
  emit_farith(0xDC, 0xF8, i);
4023
}
4024

4025
// Note: The Intel manual (Pentium Processor User's Manual, Vol.3, 1994)
4026
//       is erroneous for some of the floating-point instructions below.
4027

4028
void Assembler::fdivp(int i) {
4029
  emit_farith(0xDE, 0xF8, i);                    // ST(0) <- ST(0) / ST(1) and pop (Intel manual wrong)
4030
}
4031

4032
void Assembler::fdivr(int i) {
4033
  emit_farith(0xD8, 0xF8, i);
4034
}
4035

4036
void Assembler::fdivr_d(Address src) {
4037
  InstructionMark im(this);
4038
  emit_int8((unsigned char)0xDC);
4039
  emit_operand32(rdi, src);
4040
}
4041

4042
void Assembler::fdivr_s(Address src) {
4043
  InstructionMark im(this);
4044
  emit_int8((unsigned char)0xD8);
4045
  emit_operand32(rdi, src);
4046
}
4047

4048
void Assembler::fdivra(int i) {
4049
  emit_farith(0xDC, 0xF0, i);
4050
}
4051

4052
void Assembler::fdivrp(int i) {
4053
  emit_farith(0xDE, 0xF0, i);                    // ST(0) <- ST(1) / ST(0) and pop (Intel manual wrong)
4054
}
4055

4056
void Assembler::ffree(int i) {
4057
  emit_farith(0xDD, 0xC0, i);
4058
}
4059

4060
void Assembler::fild_d(Address adr) {
4061
  InstructionMark im(this);
4062
  emit_int8((unsigned char)0xDF);
4063
  emit_operand32(rbp, adr);
4064
}
4065

4066
void Assembler::fild_s(Address adr) {
4067
  InstructionMark im(this);
4068
  emit_int8((unsigned char)0xDB);
4069
  emit_operand32(rax, adr);
4070
}
4071

4072
void Assembler::fincstp() {
4073
  emit_int8((unsigned char)0xD9);
4074
  emit_int8((unsigned char)0xF7);
4075
}
4076

4077
void Assembler::finit() {
4078
  emit_int8((unsigned char)0x9B);
4079
  emit_int8((unsigned char)0xDB);
4080
  emit_int8((unsigned char)0xE3);
4081
}
4082

4083
void Assembler::fist_s(Address adr) {
4084
  InstructionMark im(this);
4085
  emit_int8((unsigned char)0xDB);
4086
  emit_operand32(rdx, adr);
4087
}
4088

4089
void Assembler::fistp_d(Address adr) {
4090
  InstructionMark im(this);
4091
  emit_int8((unsigned char)0xDF);
4092
  emit_operand32(rdi, adr);
4093
}
4094

4095
void Assembler::fistp_s(Address adr) {
4096
  InstructionMark im(this);
4097
  emit_int8((unsigned char)0xDB);
4098
  emit_operand32(rbx, adr);
4099
}
4100

4101
void Assembler::fld1() {
4102
  emit_int8((unsigned char)0xD9);
4103
  emit_int8((unsigned char)0xE8);
4104
}
4105

4106
void Assembler::fld_d(Address adr) {
4107
  InstructionMark im(this);
4108
  emit_int8((unsigned char)0xDD);
4109
  emit_operand32(rax, adr);
4110
}
4111

4112
void Assembler::fld_s(Address adr) {
4113
  InstructionMark im(this);
4114
  emit_int8((unsigned char)0xD9);
4115
  emit_operand32(rax, adr);
4116
}
4117

4118

4119
void Assembler::fld_s(int index) {
4120
  emit_farith(0xD9, 0xC0, index);
4121
}
4122

4123
void Assembler::fld_x(Address adr) {
4124
  InstructionMark im(this);
4125
  emit_int8((unsigned char)0xDB);
4126
  emit_operand32(rbp, adr);
4127
}
4128

4129
void Assembler::fldcw(Address src) {
4130
  InstructionMark im(this);
4131
  emit_int8((unsigned char)0xD9);
4132
  emit_operand32(rbp, src);
4133
}
4134

4135
void Assembler::fldenv(Address src) {
4136
  InstructionMark im(this);
4137
  emit_int8((unsigned char)0xD9);
4138
  emit_operand32(rsp, src);
4139
}
4140

4141
void Assembler::fldlg2() {
4142
  emit_int8((unsigned char)0xD9);
4143
  emit_int8((unsigned char)0xEC);
4144
}
4145

4146
void Assembler::fldln2() {
4147
  emit_int8((unsigned char)0xD9);
4148
  emit_int8((unsigned char)0xED);
4149
}
4150

4151
void Assembler::fldz() {
4152
  emit_int8((unsigned char)0xD9);
4153
  emit_int8((unsigned char)0xEE);
4154
}
4155

4156
void Assembler::flog() {
4157
  fldln2();
4158
  fxch();
4159
  fyl2x();
4160
}
4161

4162
void Assembler::flog10() {
4163
  fldlg2();
4164
  fxch();
4165
  fyl2x();
4166
}
4167

4168
void Assembler::fmul(int i) {
4169
  emit_farith(0xD8, 0xC8, i);
4170
}
4171

4172
void Assembler::fmul_d(Address src) {
4173
  InstructionMark im(this);
4174
  emit_int8((unsigned char)0xDC);
4175
  emit_operand32(rcx, src);
4176
}
4177

4178
void Assembler::fmul_s(Address src) {
4179
  InstructionMark im(this);
4180
  emit_int8((unsigned char)0xD8);
4181
  emit_operand32(rcx, src);
4182
}
4183

4184
void Assembler::fmula(int i) {
4185
  emit_farith(0xDC, 0xC8, i);
4186
}
4187

4188
void Assembler::fmulp(int i) {
4189
  emit_farith(0xDE, 0xC8, i);
4190
}
4191

4192
void Assembler::fnsave(Address dst) {
4193
  InstructionMark im(this);
4194
  emit_int8((unsigned char)0xDD);
4195
  emit_operand32(rsi, dst);
4196
}
4197

4198
void Assembler::fnstcw(Address src) {
4199
  InstructionMark im(this);
4200
  emit_int8((unsigned char)0x9B);
4201
  emit_int8((unsigned char)0xD9);
4202
  emit_operand32(rdi, src);
4203
}
4204

4205
void Assembler::fnstsw_ax() {
4206
  emit_int8((unsigned char)0xDF);
4207
  emit_int8((unsigned char)0xE0);
4208
}
4209

4210
void Assembler::fprem() {
4211
  emit_int8((unsigned char)0xD9);
4212
  emit_int8((unsigned char)0xF8);
4213
}
4214

4215
void Assembler::fprem1() {
4216
  emit_int8((unsigned char)0xD9);
4217
  emit_int8((unsigned char)0xF5);
4218
}
4219

4220
void Assembler::frstor(Address src) {
4221
  InstructionMark im(this);
4222
  emit_int8((unsigned char)0xDD);
4223
  emit_operand32(rsp, src);
4224
}
4225

4226
void Assembler::fsin() {
4227
  emit_int8((unsigned char)0xD9);
4228
  emit_int8((unsigned char)0xFE);
4229
}
4230

4231
void Assembler::fsqrt() {
4232
  emit_int8((unsigned char)0xD9);
4233
  emit_int8((unsigned char)0xFA);
4234
}
4235

4236
void Assembler::fst_d(Address adr) {
4237
  InstructionMark im(this);
4238
  emit_int8((unsigned char)0xDD);
4239
  emit_operand32(rdx, adr);
4240
}
4241

4242
void Assembler::fst_s(Address adr) {
4243
  InstructionMark im(this);
4244
  emit_int8((unsigned char)0xD9);
4245
  emit_operand32(rdx, adr);
4246
}
4247

4248
void Assembler::fstp_d(Address adr) {
4249
  InstructionMark im(this);
4250
  emit_int8((unsigned char)0xDD);
4251
  emit_operand32(rbx, adr);
4252
}
4253

4254
void Assembler::fstp_d(int index) {
4255
  emit_farith(0xDD, 0xD8, index);
4256
}
4257

4258
void Assembler::fstp_s(Address adr) {
4259
  InstructionMark im(this);
4260
  emit_int8((unsigned char)0xD9);
4261
  emit_operand32(rbx, adr);
4262
}
4263

4264
void Assembler::fstp_x(Address adr) {
4265
  InstructionMark im(this);
4266
  emit_int8((unsigned char)0xDB);
4267
  emit_operand32(rdi, adr);
4268
}
4269

4270
void Assembler::fsub(int i) {
4271
  emit_farith(0xD8, 0xE0, i);
4272
}
4273

4274
void Assembler::fsub_d(Address src) {
4275
  InstructionMark im(this);
4276
  emit_int8((unsigned char)0xDC);
4277
  emit_operand32(rsp, src);
4278
}
4279

4280
void Assembler::fsub_s(Address src) {
4281
  InstructionMark im(this);
4282
  emit_int8((unsigned char)0xD8);
4283
  emit_operand32(rsp, src);
4284
}
4285

4286
void Assembler::fsuba(int i) {
4287
  emit_farith(0xDC, 0xE8, i);
4288
}
4289

4290
void Assembler::fsubp(int i) {
4291
  emit_farith(0xDE, 0xE8, i);                    // ST(0) <- ST(0) - ST(1) and pop (Intel manual wrong)
4292
}
4293

4294
void Assembler::fsubr(int i) {
4295
  emit_farith(0xD8, 0xE8, i);
4296
}
4297

4298
void Assembler::fsubr_d(Address src) {
4299
  InstructionMark im(this);
4300
  emit_int8((unsigned char)0xDC);
4301
  emit_operand32(rbp, src);
4302
}
4303

4304
void Assembler::fsubr_s(Address src) {
4305
  InstructionMark im(this);
4306
  emit_int8((unsigned char)0xD8);
4307
  emit_operand32(rbp, src);
4308
}
4309

4310
void Assembler::fsubra(int i) {
4311
  emit_farith(0xDC, 0xE0, i);
4312
}
4313

4314
void Assembler::fsubrp(int i) {
4315
  emit_farith(0xDE, 0xE0, i);                    // ST(0) <- ST(1) - ST(0) and pop (Intel manual wrong)
4316
}
4317

4318
void Assembler::ftan() {
4319
  emit_int8((unsigned char)0xD9);
4320
  emit_int8((unsigned char)0xF2);
4321
  emit_int8((unsigned char)0xDD);
4322
  emit_int8((unsigned char)0xD8);
4323
}
4324

4325
void Assembler::ftst() {
4326
  emit_int8((unsigned char)0xD9);
4327
  emit_int8((unsigned char)0xE4);
4328
}
4329

4330
void Assembler::fucomi(int i) {
4331
  // make sure the instruction is supported (introduced for P6, together with cmov)
4332
  guarantee(VM_Version::supports_cmov(), "illegal instruction");
4333
  emit_farith(0xDB, 0xE8, i);
4334
}
4335

4336
void Assembler::fucomip(int i) {
4337
  // make sure the instruction is supported (introduced for P6, together with cmov)
4338
  guarantee(VM_Version::supports_cmov(), "illegal instruction");
4339
  emit_farith(0xDF, 0xE8, i);
4340
}
4341

4342
void Assembler::fwait() {
4343
  emit_int8((unsigned char)0x9B);
4344
}
4345

4346
void Assembler::fxch(int i) {
4347
  emit_farith(0xD9, 0xC8, i);
4348
}
4349

4350
void Assembler::fyl2x() {
4351
  emit_int8((unsigned char)0xD9);
4352
  emit_int8((unsigned char)0xF1);
4353
}
4354

4355
void Assembler::frndint() {
4356
  emit_int8((unsigned char)0xD9);
4357
  emit_int8((unsigned char)0xFC);
4358
}
4359

4360
void Assembler::f2xm1() {
4361
  emit_int8((unsigned char)0xD9);
4362
  emit_int8((unsigned char)0xF0);
4363
}
4364

4365
void Assembler::fldl2e() {
4366
  emit_int8((unsigned char)0xD9);
4367
  emit_int8((unsigned char)0xEA);
4368
}
4369

4370
// SSE SIMD prefix byte values corresponding to VexSimdPrefix encoding.
4371
static int simd_pre[4] = { 0, 0x66, 0xF3, 0xF2 };
4372
// SSE opcode second byte values (first is 0x0F) corresponding to VexOpcode encoding.
4373
static int simd_opc[4] = { 0,    0, 0x38, 0x3A };
4374

4375
// Generate SSE legacy REX prefix and SIMD opcode based on VEX encoding.
4376
void Assembler::rex_prefix(Address adr, XMMRegister xreg, VexSimdPrefix pre, VexOpcode opc, bool rex_w) {
4377
  if (pre > 0) {
4378
    emit_int8(simd_pre[pre]);
4379
  }
4380
  if (rex_w) {
4381
    prefixq(adr, xreg);
4382
  } else {
4383
    prefix(adr, xreg);
4384
  }
4385
  if (opc > 0) {
4386
    emit_int8(0x0F);
4387
    int opc2 = simd_opc[opc];
4388
    if (opc2 > 0) {
4389
      emit_int8(opc2);
4390
    }
4391
  }
4392
}
4393

4394
int Assembler::rex_prefix_and_encode(int dst_enc, int src_enc, VexSimdPrefix pre, VexOpcode opc, bool rex_w) {
4395
  if (pre > 0) {
4396
    emit_int8(simd_pre[pre]);
4397
  }
4398
  int encode = (rex_w) ? prefixq_and_encode(dst_enc, src_enc) :
4399
                          prefix_and_encode(dst_enc, src_enc);
4400
  if (opc > 0) {
4401
    emit_int8(0x0F);
4402
    int opc2 = simd_opc[opc];
4403
    if (opc2 > 0) {
4404
      emit_int8(opc2);
4405
    }
4406
  }
4407
  return encode;
4408
}
4409

4410

4411
void Assembler::vex_prefix(bool vex_r, bool vex_b, bool vex_x, bool vex_w, int nds_enc, VexSimdPrefix pre, VexOpcode opc, bool vector256) {
4412
  if (vex_b || vex_x || vex_w || (opc == VEX_OPCODE_0F_38) || (opc == VEX_OPCODE_0F_3A)) {
4413
    prefix(VEX_3bytes);
4414

4415
    int byte1 = (vex_r ? VEX_R : 0) | (vex_x ? VEX_X : 0) | (vex_b ? VEX_B : 0);
4416
    byte1 = (~byte1) & 0xE0;
4417
    byte1 |= opc;
4418
    emit_int8(byte1);
4419

4420
    int byte2 = ((~nds_enc) & 0xf) << 3;
4421
    byte2 |= (vex_w ? VEX_W : 0) | (vector256 ? 4 : 0) | pre;
4422
    emit_int8(byte2);
4423
  } else {
4424
    prefix(VEX_2bytes);
4425

4426
    int byte1 = vex_r ? VEX_R : 0;
4427
    byte1 = (~byte1) & 0x80;
4428
    byte1 |= ((~nds_enc) & 0xf) << 3;
4429
    byte1 |= (vector256 ? 4 : 0) | pre;
4430
    emit_int8(byte1);
4431
  }
4432
}
4433

4434
void Assembler::vex_prefix(Address adr, int nds_enc, int xreg_enc, VexSimdPrefix pre, VexOpcode opc, bool vex_w, bool vector256){
4435
  bool vex_r = (xreg_enc >= 8);
4436
  bool vex_b = adr.base_needs_rex();
4437
  bool vex_x = adr.index_needs_rex();
4438
  vex_prefix(vex_r, vex_b, vex_x, vex_w, nds_enc, pre, opc, vector256);
4439
}
4440

4441
int Assembler::vex_prefix_and_encode(int dst_enc, int nds_enc, int src_enc, VexSimdPrefix pre, VexOpcode opc, bool vex_w, bool vector256) {
4442
  bool vex_r = (dst_enc >= 8);
4443
  bool vex_b = (src_enc >= 8);
4444
  bool vex_x = false;
4445
  vex_prefix(vex_r, vex_b, vex_x, vex_w, nds_enc, pre, opc, vector256);
4446
  return (((dst_enc & 7) << 3) | (src_enc & 7));
4447
}
4448

4449

4450
void Assembler::simd_prefix(XMMRegister xreg, XMMRegister nds, Address adr, VexSimdPrefix pre, VexOpcode opc, bool rex_w, bool vector256) {
4451
  if (UseAVX > 0) {
4452
    int xreg_enc = xreg->encoding();
4453
    int  nds_enc = nds->is_valid() ? nds->encoding() : 0;
4454
    vex_prefix(adr, nds_enc, xreg_enc, pre, opc, rex_w, vector256);
4455
  } else {
4456
    assert((nds == xreg) || (nds == xnoreg), "wrong sse encoding");
4457
    rex_prefix(adr, xreg, pre, opc, rex_w);
4458
  }
4459
}
4460

4461
int Assembler::simd_prefix_and_encode(XMMRegister dst, XMMRegister nds, XMMRegister src, VexSimdPrefix pre, VexOpcode opc, bool rex_w, bool vector256) {
4462
  int dst_enc = dst->encoding();
4463
  int src_enc = src->encoding();
4464
  if (UseAVX > 0) {
4465
    int nds_enc = nds->is_valid() ? nds->encoding() : 0;
4466
    return vex_prefix_and_encode(dst_enc, nds_enc, src_enc, pre, opc, rex_w, vector256);
4467
  } else {
4468
    assert((nds == dst) || (nds == src) || (nds == xnoreg), "wrong sse encoding");
4469
    return rex_prefix_and_encode(dst_enc, src_enc, pre, opc, rex_w);
4470
  }
4471
}
4472

4473
void Assembler::emit_simd_arith(int opcode, XMMRegister dst, Address src, VexSimdPrefix pre) {
4474
  InstructionMark im(this);
4475
  simd_prefix(dst, dst, src, pre);
4476
  emit_int8(opcode);
4477
  emit_operand(dst, src);
4478
}
4479

4480
void Assembler::emit_simd_arith(int opcode, XMMRegister dst, XMMRegister src, VexSimdPrefix pre) {
4481
  int encode = simd_prefix_and_encode(dst, dst, src, pre);
4482
  emit_int8(opcode);
4483
  emit_int8((unsigned char)(0xC0 | encode));
4484
}
4485

4486
// Versions with no second source register (non-destructive source).
4487
void Assembler::emit_simd_arith_nonds(int opcode, XMMRegister dst, Address src, VexSimdPrefix pre) {
4488
  InstructionMark im(this);
4489
  simd_prefix(dst, xnoreg, src, pre);
4490
  emit_int8(opcode);
4491
  emit_operand(dst, src);
4492
}
4493

4494
void Assembler::emit_simd_arith_nonds(int opcode, XMMRegister dst, XMMRegister src, VexSimdPrefix pre) {
4495
  int encode = simd_prefix_and_encode(dst, xnoreg, src, pre);
4496
  emit_int8(opcode);
4497
  emit_int8((unsigned char)(0xC0 | encode));
4498
}
4499

4500
// 3-operands AVX instructions
4501
void Assembler::emit_vex_arith(int opcode, XMMRegister dst, XMMRegister nds,
4502
                               Address src, VexSimdPrefix pre, bool vector256) {
4503
  InstructionMark im(this);
4504
  vex_prefix(dst, nds, src, pre, vector256);
4505
  emit_int8(opcode);
4506
  emit_operand(dst, src);
4507
}
4508

4509
void Assembler::emit_vex_arith(int opcode, XMMRegister dst, XMMRegister nds,
4510
                               XMMRegister src, VexSimdPrefix pre, bool vector256) {
4511
  int encode = vex_prefix_and_encode(dst, nds, src, pre, vector256);
4512
  emit_int8(opcode);
4513
  emit_int8((unsigned char)(0xC0 | encode));
4514
}
4515

4516
#ifndef _LP64
4517

4518
void Assembler::incl(Register dst) {
4519
  // Don't use it directly. Use MacroAssembler::incrementl() instead.
4520
  emit_int8(0x40 | dst->encoding());
4521
}
4522

4523
void Assembler::lea(Register dst, Address src) {
4524
  leal(dst, src);
4525
}
4526

4527
void Assembler::mov_literal32(Address dst, int32_t imm32,  RelocationHolder const& rspec) {
4528
  InstructionMark im(this);
4529
  emit_int8((unsigned char)0xC7);
4530
  emit_operand(rax, dst);
4531
  emit_data((int)imm32, rspec, 0);
4532
}
4533

4534
void Assembler::mov_literal32(Register dst, int32_t imm32, RelocationHolder const& rspec) {
4535
  InstructionMark im(this);
4536
  int encode = prefix_and_encode(dst->encoding());
4537
  emit_int8((unsigned char)(0xB8 | encode));
4538
  emit_data((int)imm32, rspec, 0);
4539
}
4540

4541
void Assembler::popa() { // 32bit
4542
  emit_int8(0x61);
4543
}
4544

4545
void Assembler::push_literal32(int32_t imm32, RelocationHolder const& rspec) {
4546
  InstructionMark im(this);
4547
  emit_int8(0x68);
4548
  emit_data(imm32, rspec, 0);
4549
}
4550

4551
void Assembler::pusha() { // 32bit
4552
  emit_int8(0x60);
4553
}
4554

4555
void Assembler::set_byte_if_not_zero(Register dst) {
4556
  emit_int8(0x0F);
4557
  emit_int8((unsigned char)0x95);
4558
  emit_int8((unsigned char)(0xE0 | dst->encoding()));
4559
}
4560

4561
void Assembler::shldl(Register dst, Register src) {
4562
  emit_int8(0x0F);
4563
  emit_int8((unsigned char)0xA5);
4564
  emit_int8((unsigned char)(0xC0 | src->encoding() << 3 | dst->encoding()));
4565
}
4566

4567
void Assembler::shrdl(Register dst, Register src) {
4568
  emit_int8(0x0F);
4569
  emit_int8((unsigned char)0xAD);
4570
  emit_int8((unsigned char)(0xC0 | src->encoding() << 3 | dst->encoding()));
4571
}
4572

4573
#else // LP64
4574

4575
void Assembler::set_byte_if_not_zero(Register dst) {
4576
  int enc = prefix_and_encode(dst->encoding(), true);
4577
  emit_int8(0x0F);
4578
  emit_int8((unsigned char)0x95);
4579
  emit_int8((unsigned char)(0xE0 | enc));
4580
}
4581

4582
// 64bit only pieces of the assembler
4583
// This should only be used by 64bit instructions that can use rip-relative
4584
// it cannot be used by instructions that want an immediate value.
4585

4586
bool Assembler::reachable(AddressLiteral adr) {
4587
  int64_t disp;
4588
  // None will force a 64bit literal to the code stream. Likely a placeholder
4589
  // for something that will be patched later and we need to certain it will
4590
  // always be reachable.
4591
  if (adr.reloc() == relocInfo::none) {
4592
    return false;
4593
  }
4594
  if (adr.reloc() == relocInfo::internal_word_type) {
4595
    // This should be rip relative and easily reachable.
4596
    return true;
4597
  }
4598
  if (adr.reloc() == relocInfo::virtual_call_type ||
4599
      adr.reloc() == relocInfo::opt_virtual_call_type ||
4600
      adr.reloc() == relocInfo::static_call_type ||
4601
      adr.reloc() == relocInfo::static_stub_type ) {
4602
    // This should be rip relative within the code cache and easily
4603
    // reachable until we get huge code caches. (At which point
4604
    // ic code is going to have issues).
4605
    return true;
4606
  }
4607
  if (adr.reloc() != relocInfo::external_word_type &&
4608
      adr.reloc() != relocInfo::poll_return_type &&  // these are really external_word but need special
4609
      adr.reloc() != relocInfo::poll_type &&         // relocs to identify them
4610
      adr.reloc() != relocInfo::runtime_call_type ) {
4611
    return false;
4612
  }
4613

4614
  // Stress the correction code
4615
  if (ForceUnreachable) {
4616
    // Must be runtimecall reloc, see if it is in the codecache
4617
    // Flipping stuff in the codecache to be unreachable causes issues
4618
    // with things like inline caches where the additional instructions
4619
    // are not handled.
4620
    if (CodeCache::find_blob(adr._target) == NULL) {
4621
      return false;
4622
    }
4623
  }
4624
  // For external_word_type/runtime_call_type if it is reachable from where we
4625
  // are now (possibly a temp buffer) and where we might end up
4626
  // anywhere in the codeCache then we are always reachable.
4627
  // This would have to change if we ever save/restore shared code
4628
  // to be more pessimistic.
4629
  disp = (int64_t)adr._target - ((int64_t)CodeCache::low_bound() + sizeof(int));
4630
  if (!is_simm32(disp)) return false;
4631
  disp = (int64_t)adr._target - ((int64_t)CodeCache::high_bound() + sizeof(int));
4632
  if (!is_simm32(disp)) return false;
4633

4634
  disp = (int64_t)adr._target - ((int64_t)pc() + sizeof(int));
4635

4636
  // Because rip relative is a disp + address_of_next_instruction and we
4637
  // don't know the value of address_of_next_instruction we apply a fudge factor
4638
  // to make sure we will be ok no matter the size of the instruction we get placed into.
4639
  // We don't have to fudge the checks above here because they are already worst case.
4640

4641
  // 12 == override/rex byte, opcode byte, rm byte, sib byte, a 4-byte disp , 4-byte literal
4642
  // + 4 because better safe than sorry.
4643
  const int fudge = 12 + 4;
4644
  if (disp < 0) {
4645
    disp -= fudge;
4646
  } else {
4647
    disp += fudge;
4648
  }
4649
  return is_simm32(disp);
4650
}
4651

4652
// Check if the polling page is not reachable from the code cache using rip-relative
4653
// addressing.
4654
bool Assembler::is_polling_page_far() {
4655
  intptr_t addr = (intptr_t)os::get_polling_page();
4656
  return ForceUnreachable ||
4657
         !is_simm32(addr - (intptr_t)CodeCache::low_bound()) ||
4658
         !is_simm32(addr - (intptr_t)CodeCache::high_bound());
4659
}
4660

4661
void Assembler::emit_data64(jlong data,
4662
                            relocInfo::relocType rtype,
4663
                            int format) {
4664
  if (rtype == relocInfo::none) {
4665
    emit_int64(data);
4666
  } else {
4667
    emit_data64(data, Relocation::spec_simple(rtype), format);
4668
  }
4669
}
4670

4671
void Assembler::emit_data64(jlong data,
4672
                            RelocationHolder const& rspec,
4673
                            int format) {
4674
  assert(imm_operand == 0, "default format must be immediate in this file");
4675
  assert(imm_operand == format, "must be immediate");
4676
  assert(inst_mark() != NULL, "must be inside InstructionMark");
4677
  // Do not use AbstractAssembler::relocate, which is not intended for
4678
  // embedded words.  Instead, relocate to the enclosing instruction.
4679
  code_section()->relocate(inst_mark(), rspec, format);
4680
#ifdef ASSERT
4681
  check_relocation(rspec, format);
4682
#endif
4683
  emit_int64(data);
4684
}
4685

4686
int Assembler::prefix_and_encode(int reg_enc, bool byteinst) {
4687
  if (reg_enc >= 8) {
4688
    prefix(REX_B);
4689
    reg_enc -= 8;
4690
  } else if (byteinst && reg_enc >= 4) {
4691
    prefix(REX);
4692
  }
4693
  return reg_enc;
4694
}
4695

4696
int Assembler::prefixq_and_encode(int reg_enc) {
4697
  if (reg_enc < 8) {
4698
    prefix(REX_W);
4699
  } else {
4700
    prefix(REX_WB);
4701
    reg_enc -= 8;
4702
  }
4703
  return reg_enc;
4704
}
4705

4706
int Assembler::prefix_and_encode(int dst_enc, int src_enc, bool byteinst) {
4707
  if (dst_enc < 8) {
4708
    if (src_enc >= 8) {
4709
      prefix(REX_B);
4710
      src_enc -= 8;
4711
    } else if (byteinst && src_enc >= 4) {
4712
      prefix(REX);
4713
    }
4714
  } else {
4715
    if (src_enc < 8) {
4716
      prefix(REX_R);
4717
    } else {
4718
      prefix(REX_RB);
4719
      src_enc -= 8;
4720
    }
4721
    dst_enc -= 8;
4722
  }
4723
  return dst_enc << 3 | src_enc;
4724
}
4725

4726
int Assembler::prefixq_and_encode(int dst_enc, int src_enc) {
4727
  if (dst_enc < 8) {
4728
    if (src_enc < 8) {
4729
      prefix(REX_W);
4730
    } else {
4731
      prefix(REX_WB);
4732
      src_enc -= 8;
4733
    }
4734
  } else {
4735
    if (src_enc < 8) {
4736
      prefix(REX_WR);
4737
    } else {
4738
      prefix(REX_WRB);
4739
      src_enc -= 8;
4740
    }
4741
    dst_enc -= 8;
4742
  }
4743
  return dst_enc << 3 | src_enc;
4744
}
4745

4746
void Assembler::prefix(Register reg) {
4747
  if (reg->encoding() >= 8) {
4748
    prefix(REX_B);
4749
  }
4750
}
4751

4752
void Assembler::prefix(Address adr) {
4753
  if (adr.base_needs_rex()) {
4754
    if (adr.index_needs_rex()) {
4755
      prefix(REX_XB);
4756
    } else {
4757
      prefix(REX_B);
4758
    }
4759
  } else {
4760
    if (adr.index_needs_rex()) {
4761
      prefix(REX_X);
4762
    }
4763
  }
4764
}
4765

4766
void Assembler::prefixq(Address adr) {
4767
  if (adr.base_needs_rex()) {
4768
    if (adr.index_needs_rex()) {
4769
      prefix(REX_WXB);
4770
    } else {
4771
      prefix(REX_WB);
4772
    }
4773
  } else {
4774
    if (adr.index_needs_rex()) {
4775
      prefix(REX_WX);
4776
    } else {
4777
      prefix(REX_W);
4778
    }
4779
  }
4780
}
4781

4782

4783
void Assembler::prefix(Address adr, Register reg, bool byteinst) {
4784
  if (reg->encoding() < 8) {
4785
    if (adr.base_needs_rex()) {
4786
      if (adr.index_needs_rex()) {
4787
        prefix(REX_XB);
4788
      } else {
4789
        prefix(REX_B);
4790
      }
4791
    } else {
4792
      if (adr.index_needs_rex()) {
4793
        prefix(REX_X);
4794
      } else if (byteinst && reg->encoding() >= 4 ) {
4795
        prefix(REX);
4796
      }
4797
    }
4798
  } else {
4799
    if (adr.base_needs_rex()) {
4800
      if (adr.index_needs_rex()) {
4801
        prefix(REX_RXB);
4802
      } else {
4803
        prefix(REX_RB);
4804
      }
4805
    } else {
4806
      if (adr.index_needs_rex()) {
4807
        prefix(REX_RX);
4808
      } else {
4809
        prefix(REX_R);
4810
      }
4811
    }
4812
  }
4813
}
4814

4815
void Assembler::prefixq(Address adr, Register src) {
4816
  if (src->encoding() < 8) {
4817
    if (adr.base_needs_rex()) {
4818
      if (adr.index_needs_rex()) {
4819
        prefix(REX_WXB);
4820
      } else {
4821
        prefix(REX_WB);
4822
      }
4823
    } else {
4824
      if (adr.index_needs_rex()) {
4825
        prefix(REX_WX);
4826
      } else {
4827
        prefix(REX_W);
4828
      }
4829
    }
4830
  } else {
4831
    if (adr.base_needs_rex()) {
4832
      if (adr.index_needs_rex()) {
4833
        prefix(REX_WRXB);
4834
      } else {
4835
        prefix(REX_WRB);
4836
      }
4837
    } else {
4838
      if (adr.index_needs_rex()) {
4839
        prefix(REX_WRX);
4840
      } else {
4841
        prefix(REX_WR);
4842
      }
4843
    }
4844
  }
4845
}
4846

4847
void Assembler::prefix(Address adr, XMMRegister reg) {
4848
  if (reg->encoding() < 8) {
4849
    if (adr.base_needs_rex()) {
4850
      if (adr.index_needs_rex()) {
4851
        prefix(REX_XB);
4852
      } else {
4853
        prefix(REX_B);
4854
      }
4855
    } else {
4856
      if (adr.index_needs_rex()) {
4857
        prefix(REX_X);
4858
      }
4859
    }
4860
  } else {
4861
    if (adr.base_needs_rex()) {
4862
      if (adr.index_needs_rex()) {
4863
        prefix(REX_RXB);
4864
      } else {
4865
        prefix(REX_RB);
4866
      }
4867
    } else {
4868
      if (adr.index_needs_rex()) {
4869
        prefix(REX_RX);
4870
      } else {
4871
        prefix(REX_R);
4872
      }
4873
    }
4874
  }
4875
}
4876

4877
void Assembler::prefixq(Address adr, XMMRegister src) {
4878
  if (src->encoding() < 8) {
4879
    if (adr.base_needs_rex()) {
4880
      if (adr.index_needs_rex()) {
4881
        prefix(REX_WXB);
4882
      } else {
4883
        prefix(REX_WB);
4884
      }
4885
    } else {
4886
      if (adr.index_needs_rex()) {
4887
        prefix(REX_WX);
4888
      } else {
4889
        prefix(REX_W);
4890
      }
4891
    }
4892
  } else {
4893
    if (adr.base_needs_rex()) {
4894
      if (adr.index_needs_rex()) {
4895
        prefix(REX_WRXB);
4896
      } else {
4897
        prefix(REX_WRB);
4898
      }
4899
    } else {
4900
      if (adr.index_needs_rex()) {
4901
        prefix(REX_WRX);
4902
      } else {
4903
        prefix(REX_WR);
4904
      }
4905
    }
4906
  }
4907
}
4908

4909
void Assembler::adcq(Register dst, int32_t imm32) {
4910
  (void) prefixq_and_encode(dst->encoding());
4911
  emit_arith(0x81, 0xD0, dst, imm32);
4912
}
4913

4914
void Assembler::adcq(Register dst, Address src) {
4915
  InstructionMark im(this);
4916
  prefixq(src, dst);
4917
  emit_int8(0x13);
4918
  emit_operand(dst, src);
4919
}
4920

4921
void Assembler::adcq(Register dst, Register src) {
4922
  (void) prefixq_and_encode(dst->encoding(), src->encoding());
4923
  emit_arith(0x13, 0xC0, dst, src);
4924
}
4925

4926
void Assembler::addq(Address dst, int32_t imm32) {
4927
  InstructionMark im(this);
4928
  prefixq(dst);
4929
  emit_arith_operand(0x81, rax, dst,imm32);
4930
}
4931

4932
void Assembler::addq(Address dst, Register src) {
4933
  InstructionMark im(this);
4934
  prefixq(dst, src);
4935
  emit_int8(0x01);
4936
  emit_operand(src, dst);
4937
}
4938

4939
void Assembler::addq(Register dst, int32_t imm32) {
4940
  (void) prefixq_and_encode(dst->encoding());
4941
  emit_arith(0x81, 0xC0, dst, imm32);
4942
}
4943

4944
void Assembler::addq(Register dst, Address src) {
4945
  InstructionMark im(this);
4946
  prefixq(src, dst);
4947
  emit_int8(0x03);
4948
  emit_operand(dst, src);
4949
}
4950

4951
void Assembler::addq(Register dst, Register src) {
4952
  (void) prefixq_and_encode(dst->encoding(), src->encoding());
4953
  emit_arith(0x03, 0xC0, dst, src);
4954
}
4955

4956
void Assembler::adcxq(Register dst, Register src) {
4957
  //assert(VM_Version::supports_adx(), "adx instructions not supported");
4958
  emit_int8((unsigned char)0x66);
4959
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
4960
  emit_int8(0x0F);
4961
  emit_int8(0x38);
4962
  emit_int8((unsigned char)0xF6);
4963
  emit_int8((unsigned char)(0xC0 | encode));
4964
}
4965

4966
void Assembler::adoxq(Register dst, Register src) {
4967
  //assert(VM_Version::supports_adx(), "adx instructions not supported");
4968
  emit_int8((unsigned char)0xF3);
4969
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
4970
  emit_int8(0x0F);
4971
  emit_int8(0x38);
4972
  emit_int8((unsigned char)0xF6);
4973
  emit_int8((unsigned char)(0xC0 | encode));
4974
}
4975

4976
void Assembler::andq(Address dst, int32_t imm32) {
4977
  InstructionMark im(this);
4978
  prefixq(dst);
4979
  emit_int8((unsigned char)0x81);
4980
  emit_operand(rsp, dst, 4);
4981
  emit_int32(imm32);
4982
}
4983

4984
void Assembler::andq(Register dst, int32_t imm32) {
4985
  (void) prefixq_and_encode(dst->encoding());
4986
  emit_arith(0x81, 0xE0, dst, imm32);
4987
}
4988

4989
void Assembler::andq(Register dst, Address src) {
4990
  InstructionMark im(this);
4991
  prefixq(src, dst);
4992
  emit_int8(0x23);
4993
  emit_operand(dst, src);
4994
}
4995

4996
void Assembler::andq(Register dst, Register src) {
4997
  (void) prefixq_and_encode(dst->encoding(), src->encoding());
4998
  emit_arith(0x23, 0xC0, dst, src);
4999
}
5000

5001
void Assembler::andnq(Register dst, Register src1, Register src2) {
5002
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
5003
  int encode = vex_prefix_0F38_and_encode_q(dst, src1, src2);
5004
  emit_int8((unsigned char)0xF2);
5005
  emit_int8((unsigned char)(0xC0 | encode));
5006
}
5007

5008
void Assembler::andnq(Register dst, Register src1, Address src2) {
5009
  InstructionMark im(this);
5010
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
5011
  vex_prefix_0F38_q(dst, src1, src2);
5012
  emit_int8((unsigned char)0xF2);
5013
  emit_operand(dst, src2);
5014
}
5015

5016
void Assembler::bsfq(Register dst, Register src) {
5017
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5018
  emit_int8(0x0F);
5019
  emit_int8((unsigned char)0xBC);
5020
  emit_int8((unsigned char)(0xC0 | encode));
5021
}
5022

5023
void Assembler::bsrq(Register dst, Register src) {
5024
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5025
  emit_int8(0x0F);
5026
  emit_int8((unsigned char)0xBD);
5027
  emit_int8((unsigned char)(0xC0 | encode));
5028
}
5029

5030
void Assembler::bswapq(Register reg) {
5031
  int encode = prefixq_and_encode(reg->encoding());
5032
  emit_int8(0x0F);
5033
  emit_int8((unsigned char)(0xC8 | encode));
5034
}
5035

5036
void Assembler::blsiq(Register dst, Register src) {
5037
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
5038
  int encode = vex_prefix_0F38_and_encode_q(rbx, dst, src);
5039
  emit_int8((unsigned char)0xF3);
5040
  emit_int8((unsigned char)(0xC0 | encode));
5041
}
5042

5043
void Assembler::blsiq(Register dst, Address src) {
5044
  InstructionMark im(this);
5045
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
5046
  vex_prefix_0F38_q(rbx, dst, src);
5047
  emit_int8((unsigned char)0xF3);
5048
  emit_operand(rbx, src);
5049
}
5050

5051
void Assembler::blsmskq(Register dst, Register src) {
5052
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
5053
  int encode = vex_prefix_0F38_and_encode_q(rdx, dst, src);
5054
  emit_int8((unsigned char)0xF3);
5055
  emit_int8((unsigned char)(0xC0 | encode));
5056
}
5057

5058
void Assembler::blsmskq(Register dst, Address src) {
5059
  InstructionMark im(this);
5060
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
5061
  vex_prefix_0F38_q(rdx, dst, src);
5062
  emit_int8((unsigned char)0xF3);
5063
  emit_operand(rdx, src);
5064
}
5065

5066
void Assembler::blsrq(Register dst, Register src) {
5067
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
5068
  int encode = vex_prefix_0F38_and_encode_q(rcx, dst, src);
5069
  emit_int8((unsigned char)0xF3);
5070
  emit_int8((unsigned char)(0xC0 | encode));
5071
}
5072

5073
void Assembler::blsrq(Register dst, Address src) {
5074
  InstructionMark im(this);
5075
  assert(VM_Version::supports_bmi1(), "bit manipulation instructions not supported");
5076
  vex_prefix_0F38_q(rcx, dst, src);
5077
  emit_int8((unsigned char)0xF3);
5078
  emit_operand(rcx, src);
5079
}
5080

5081
void Assembler::cdqq() {
5082
  prefix(REX_W);
5083
  emit_int8((unsigned char)0x99);
5084
}
5085

5086
void Assembler::clflush(Address adr) {
5087
  prefix(adr);
5088
  emit_int8(0x0F);
5089
  emit_int8((unsigned char)0xAE);
5090
  emit_operand(rdi, adr);
5091
}
5092

5093
void Assembler::cmovq(Condition cc, Register dst, Register src) {
5094
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5095
  emit_int8(0x0F);
5096
  emit_int8(0x40 | cc);
5097
  emit_int8((unsigned char)(0xC0 | encode));
5098
}
5099

5100
void Assembler::cmovq(Condition cc, Register dst, Address src) {
5101
  InstructionMark im(this);
5102
  prefixq(src, dst);
5103
  emit_int8(0x0F);
5104
  emit_int8(0x40 | cc);
5105
  emit_operand(dst, src);
5106
}
5107

5108
void Assembler::cmpq(Address dst, int32_t imm32) {
5109
  InstructionMark im(this);
5110
  prefixq(dst);
5111
  emit_int8((unsigned char)0x81);
5112
  emit_operand(rdi, dst, 4);
5113
  emit_int32(imm32);
5114
}
5115

5116
void Assembler::cmpq(Register dst, int32_t imm32) {
5117
  (void) prefixq_and_encode(dst->encoding());
5118
  emit_arith(0x81, 0xF8, dst, imm32);
5119
}
5120

5121
void Assembler::cmpq(Address dst, Register src) {
5122
  InstructionMark im(this);
5123
  prefixq(dst, src);
5124
  emit_int8(0x3B);
5125
  emit_operand(src, dst);
5126
}
5127

5128
void Assembler::cmpq(Register dst, Register src) {
5129
  (void) prefixq_and_encode(dst->encoding(), src->encoding());
5130
  emit_arith(0x3B, 0xC0, dst, src);
5131
}
5132

5133
void Assembler::cmpq(Register dst, Address  src) {
5134
  InstructionMark im(this);
5135
  prefixq(src, dst);
5136
  emit_int8(0x3B);
5137
  emit_operand(dst, src);
5138
}
5139

5140
void Assembler::cmpxchgq(Register reg, Address adr) {
5141
  InstructionMark im(this);
5142
  prefixq(adr, reg);
5143
  emit_int8(0x0F);
5144
  emit_int8((unsigned char)0xB1);
5145
  emit_operand(reg, adr);
5146
}
5147

5148
void Assembler::cvtsi2sdq(XMMRegister dst, Register src) {
5149
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
5150
  int encode = simd_prefix_and_encode_q(dst, dst, src, VEX_SIMD_F2);
5151
  emit_int8(0x2A);
5152
  emit_int8((unsigned char)(0xC0 | encode));
5153
}
5154

5155
void Assembler::cvtsi2sdq(XMMRegister dst, Address src) {
5156
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
5157
  InstructionMark im(this);
5158
  simd_prefix_q(dst, dst, src, VEX_SIMD_F2);
5159
  emit_int8(0x2A);
5160
  emit_operand(dst, src);
5161
}
5162

5163
void Assembler::cvtsi2ssq(XMMRegister dst, Register src) {
5164
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
5165
  int encode = simd_prefix_and_encode_q(dst, dst, src, VEX_SIMD_F3);
5166
  emit_int8(0x2A);
5167
  emit_int8((unsigned char)(0xC0 | encode));
5168
}
5169

5170
void Assembler::cvtsi2ssq(XMMRegister dst, Address src) {
5171
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
5172
  InstructionMark im(this);
5173
  simd_prefix_q(dst, dst, src, VEX_SIMD_F3);
5174
  emit_int8(0x2A);
5175
  emit_operand(dst, src);
5176
}
5177

5178
void Assembler::cvttsd2siq(Register dst, XMMRegister src) {
5179
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
5180
  int encode = simd_prefix_and_encode_q(dst, src, VEX_SIMD_F2);
5181
  emit_int8(0x2C);
5182
  emit_int8((unsigned char)(0xC0 | encode));
5183
}
5184

5185
void Assembler::cvttss2siq(Register dst, XMMRegister src) {
5186
  NOT_LP64(assert(VM_Version::supports_sse(), ""));
5187
  int encode = simd_prefix_and_encode_q(dst, src, VEX_SIMD_F3);
5188
  emit_int8(0x2C);
5189
  emit_int8((unsigned char)(0xC0 | encode));
5190
}
5191

5192
void Assembler::decl(Register dst) {
5193
  // Don't use it directly. Use MacroAssembler::decrementl() instead.
5194
  // Use two-byte form (one-byte form is a REX prefix in 64-bit mode)
5195
  int encode = prefix_and_encode(dst->encoding());
5196
  emit_int8((unsigned char)0xFF);
5197
  emit_int8((unsigned char)(0xC8 | encode));
5198
}
5199

5200
void Assembler::decq(Register dst) {
5201
  // Don't use it directly. Use MacroAssembler::decrementq() instead.
5202
  // Use two-byte form (one-byte from is a REX prefix in 64-bit mode)
5203
  int encode = prefixq_and_encode(dst->encoding());
5204
  emit_int8((unsigned char)0xFF);
5205
  emit_int8(0xC8 | encode);
5206
}
5207

5208
void Assembler::decq(Address dst) {
5209
  // Don't use it directly. Use MacroAssembler::decrementq() instead.
5210
  InstructionMark im(this);
5211
  prefixq(dst);
5212
  emit_int8((unsigned char)0xFF);
5213
  emit_operand(rcx, dst);
5214
}
5215

5216
void Assembler::fxrstor(Address src) {
5217
  prefixq(src);
5218
  emit_int8(0x0F);
5219
  emit_int8((unsigned char)0xAE);
5220
  emit_operand(as_Register(1), src);
5221
}
5222

5223
void Assembler::fxsave(Address dst) {
5224
  prefixq(dst);
5225
  emit_int8(0x0F);
5226
  emit_int8((unsigned char)0xAE);
5227
  emit_operand(as_Register(0), dst);
5228
}
5229

5230
void Assembler::idivq(Register src) {
5231
  int encode = prefixq_and_encode(src->encoding());
5232
  emit_int8((unsigned char)0xF7);
5233
  emit_int8((unsigned char)(0xF8 | encode));
5234
}
5235

5236
void Assembler::imulq(Register dst, Register src) {
5237
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5238
  emit_int8(0x0F);
5239
  emit_int8((unsigned char)0xAF);
5240
  emit_int8((unsigned char)(0xC0 | encode));
5241
}
5242

5243
void Assembler::imulq(Register dst, Register src, int value) {
5244
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5245
  if (is8bit(value)) {
5246
    emit_int8(0x6B);
5247
    emit_int8((unsigned char)(0xC0 | encode));
5248
    emit_int8(value & 0xFF);
5249
  } else {
5250
    emit_int8(0x69);
5251
    emit_int8((unsigned char)(0xC0 | encode));
5252
    emit_int32(value);
5253
  }
5254
}
5255

5256
void Assembler::imulq(Register dst, Address src) {
5257
  InstructionMark im(this);
5258
  prefixq(src, dst);
5259
  emit_int8(0x0F);
5260
  emit_int8((unsigned char) 0xAF);
5261
  emit_operand(dst, src);
5262
}
5263

5264
void Assembler::incl(Register dst) {
5265
  // Don't use it directly. Use MacroAssembler::incrementl() instead.
5266
  // Use two-byte form (one-byte from is a REX prefix in 64-bit mode)
5267
  int encode = prefix_and_encode(dst->encoding());
5268
  emit_int8((unsigned char)0xFF);
5269
  emit_int8((unsigned char)(0xC0 | encode));
5270
}
5271

5272
void Assembler::incq(Register dst) {
5273
  // Don't use it directly. Use MacroAssembler::incrementq() instead.
5274
  // Use two-byte form (one-byte from is a REX prefix in 64-bit mode)
5275
  int encode = prefixq_and_encode(dst->encoding());
5276
  emit_int8((unsigned char)0xFF);
5277
  emit_int8((unsigned char)(0xC0 | encode));
5278
}
5279

5280
void Assembler::incq(Address dst) {
5281
  // Don't use it directly. Use MacroAssembler::incrementq() instead.
5282
  InstructionMark im(this);
5283
  prefixq(dst);
5284
  emit_int8((unsigned char)0xFF);
5285
  emit_operand(rax, dst);
5286
}
5287

5288
void Assembler::lea(Register dst, Address src) {
5289
  leaq(dst, src);
5290
}
5291

5292
void Assembler::leaq(Register dst, Address src) {
5293
  InstructionMark im(this);
5294
  prefixq(src, dst);
5295
  emit_int8((unsigned char)0x8D);
5296
  emit_operand(dst, src);
5297
}
5298

5299
void Assembler::mov64(Register dst, int64_t imm64) {
5300
  InstructionMark im(this);
5301
  int encode = prefixq_and_encode(dst->encoding());
5302
  emit_int8((unsigned char)(0xB8 | encode));
5303
  emit_int64(imm64);
5304
}
5305

5306
void Assembler::mov_literal64(Register dst, intptr_t imm64, RelocationHolder const& rspec) {
5307
  InstructionMark im(this);
5308
  int encode = prefixq_and_encode(dst->encoding());
5309
  emit_int8(0xB8 | encode);
5310
  emit_data64(imm64, rspec);
5311
}
5312

5313
void Assembler::mov_narrow_oop(Register dst, int32_t imm32, RelocationHolder const& rspec) {
5314
  InstructionMark im(this);
5315
  int encode = prefix_and_encode(dst->encoding());
5316
  emit_int8((unsigned char)(0xB8 | encode));
5317
  emit_data((int)imm32, rspec, narrow_oop_operand);
5318
}
5319

5320
void Assembler::mov_narrow_oop(Address dst, int32_t imm32,  RelocationHolder const& rspec) {
5321
  InstructionMark im(this);
5322
  prefix(dst);
5323
  emit_int8((unsigned char)0xC7);
5324
  emit_operand(rax, dst, 4);
5325
  emit_data((int)imm32, rspec, narrow_oop_operand);
5326
}
5327

5328
void Assembler::cmp_narrow_oop(Register src1, int32_t imm32, RelocationHolder const& rspec) {
5329
  InstructionMark im(this);
5330
  int encode = prefix_and_encode(src1->encoding());
5331
  emit_int8((unsigned char)0x81);
5332
  emit_int8((unsigned char)(0xF8 | encode));
5333
  emit_data((int)imm32, rspec, narrow_oop_operand);
5334
}
5335

5336
void Assembler::cmp_narrow_oop(Address src1, int32_t imm32, RelocationHolder const& rspec) {
5337
  InstructionMark im(this);
5338
  prefix(src1);
5339
  emit_int8((unsigned char)0x81);
5340
  emit_operand(rax, src1, 4);
5341
  emit_data((int)imm32, rspec, narrow_oop_operand);
5342
}
5343

5344
void Assembler::lzcntq(Register dst, Register src) {
5345
  assert(VM_Version::supports_lzcnt(), "encoding is treated as BSR");
5346
  emit_int8((unsigned char)0xF3);
5347
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5348
  emit_int8(0x0F);
5349
  emit_int8((unsigned char)0xBD);
5350
  emit_int8((unsigned char)(0xC0 | encode));
5351
}
5352

5353
void Assembler::movdq(XMMRegister dst, Register src) {
5354
  // table D-1 says MMX/SSE2
5355
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
5356
  int encode = simd_prefix_and_encode_q(dst, src, VEX_SIMD_66);
5357
  emit_int8(0x6E);
5358
  emit_int8((unsigned char)(0xC0 | encode));
5359
}
5360

5361
void Assembler::movdq(Register dst, XMMRegister src) {
5362
  // table D-1 says MMX/SSE2
5363
  NOT_LP64(assert(VM_Version::supports_sse2(), ""));
5364
  // swap src/dst to get correct prefix
5365
  int encode = simd_prefix_and_encode_q(src, dst, VEX_SIMD_66);
5366
  emit_int8(0x7E);
5367
  emit_int8((unsigned char)(0xC0 | encode));
5368
}
5369

5370
void Assembler::movq(Register dst, Register src) {
5371
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5372
  emit_int8((unsigned char)0x8B);
5373
  emit_int8((unsigned char)(0xC0 | encode));
5374
}
5375

5376
void Assembler::movq(Register dst, Address src) {
5377
  InstructionMark im(this);
5378
  prefixq(src, dst);
5379
  emit_int8((unsigned char)0x8B);
5380
  emit_operand(dst, src);
5381
}
5382

5383
void Assembler::movq(Address dst, Register src) {
5384
  InstructionMark im(this);
5385
  prefixq(dst, src);
5386
  emit_int8((unsigned char)0x89);
5387
  emit_operand(src, dst);
5388
}
5389

5390
void Assembler::movsbq(Register dst, Address src) {
5391
  InstructionMark im(this);
5392
  prefixq(src, dst);
5393
  emit_int8(0x0F);
5394
  emit_int8((unsigned char)0xBE);
5395
  emit_operand(dst, src);
5396
}
5397

5398
void Assembler::movsbq(Register dst, Register src) {
5399
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5400
  emit_int8(0x0F);
5401
  emit_int8((unsigned char)0xBE);
5402
  emit_int8((unsigned char)(0xC0 | encode));
5403
}
5404

5405
void Assembler::movslq(Register dst, int32_t imm32) {
5406
  // dbx shows movslq(rcx, 3) as movq     $0x0000000049000000,(%rbx)
5407
  // and movslq(r8, 3); as movl     $0x0000000048000000,(%rbx)
5408
  // as a result we shouldn't use until tested at runtime...
5409
  ShouldNotReachHere();
5410
  InstructionMark im(this);
5411
  int encode = prefixq_and_encode(dst->encoding());
5412
  emit_int8((unsigned char)(0xC7 | encode));
5413
  emit_int32(imm32);
5414
}
5415

5416
void Assembler::movslq(Address dst, int32_t imm32) {
5417
  assert(is_simm32(imm32), "lost bits");
5418
  InstructionMark im(this);
5419
  prefixq(dst);
5420
  emit_int8((unsigned char)0xC7);
5421
  emit_operand(rax, dst, 4);
5422
  emit_int32(imm32);
5423
}
5424

5425
void Assembler::movslq(Register dst, Address src) {
5426
  InstructionMark im(this);
5427
  prefixq(src, dst);
5428
  emit_int8(0x63);
5429
  emit_operand(dst, src);
5430
}
5431

5432
void Assembler::movslq(Register dst, Register src) {
5433
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5434
  emit_int8(0x63);
5435
  emit_int8((unsigned char)(0xC0 | encode));
5436
}
5437

5438
void Assembler::movswq(Register dst, Address src) {
5439
  InstructionMark im(this);
5440
  prefixq(src, dst);
5441
  emit_int8(0x0F);
5442
  emit_int8((unsigned char)0xBF);
5443
  emit_operand(dst, src);
5444
}
5445

5446
void Assembler::movswq(Register dst, Register src) {
5447
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5448
  emit_int8((unsigned char)0x0F);
5449
  emit_int8((unsigned char)0xBF);
5450
  emit_int8((unsigned char)(0xC0 | encode));
5451
}
5452

5453
void Assembler::movzbq(Register dst, Address src) {
5454
  InstructionMark im(this);
5455
  prefixq(src, dst);
5456
  emit_int8((unsigned char)0x0F);
5457
  emit_int8((unsigned char)0xB6);
5458
  emit_operand(dst, src);
5459
}
5460

5461
void Assembler::movzbq(Register dst, Register src) {
5462
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5463
  emit_int8(0x0F);
5464
  emit_int8((unsigned char)0xB6);
5465
  emit_int8(0xC0 | encode);
5466
}
5467

5468
void Assembler::movzwq(Register dst, Address src) {
5469
  InstructionMark im(this);
5470
  prefixq(src, dst);
5471
  emit_int8((unsigned char)0x0F);
5472
  emit_int8((unsigned char)0xB7);
5473
  emit_operand(dst, src);
5474
}
5475

5476
void Assembler::movzwq(Register dst, Register src) {
5477
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5478
  emit_int8((unsigned char)0x0F);
5479
  emit_int8((unsigned char)0xB7);
5480
  emit_int8((unsigned char)(0xC0 | encode));
5481
}
5482

5483
void Assembler::mulq(Address src) {
5484
  InstructionMark im(this);
5485
  prefixq(src);
5486
  emit_int8((unsigned char)0xF7);
5487
  emit_operand(rsp, src);
5488
}
5489

5490
void Assembler::mulq(Register src) {
5491
  int encode = prefixq_and_encode(src->encoding());
5492
  emit_int8((unsigned char)0xF7);
5493
  emit_int8((unsigned char)(0xE0 | encode));
5494
}
5495

5496
void Assembler::mulxq(Register dst1, Register dst2, Register src) {
5497
  assert(VM_Version::supports_bmi2(), "bit manipulation instructions not supported");
5498
  int encode = vex_prefix_and_encode(dst1->encoding(), dst2->encoding(), src->encoding(), VEX_SIMD_F2, VEX_OPCODE_0F_38, true, false);
5499
  emit_int8((unsigned char)0xF6);
5500
  emit_int8((unsigned char)(0xC0 | encode));
5501
}
5502

5503
void Assembler::negq(Register dst) {
5504
  int encode = prefixq_and_encode(dst->encoding());
5505
  emit_int8((unsigned char)0xF7);
5506
  emit_int8((unsigned char)(0xD8 | encode));
5507
}
5508

5509
void Assembler::notq(Register dst) {
5510
  int encode = prefixq_and_encode(dst->encoding());
5511
  emit_int8((unsigned char)0xF7);
5512
  emit_int8((unsigned char)(0xD0 | encode));
5513
}
5514

5515
void Assembler::orq(Address dst, int32_t imm32) {
5516
  InstructionMark im(this);
5517
  prefixq(dst);
5518
  emit_int8((unsigned char)0x81);
5519
  emit_operand(rcx, dst, 4);
5520
  emit_int32(imm32);
5521
}
5522

5523
void Assembler::orq(Register dst, int32_t imm32) {
5524
  (void) prefixq_and_encode(dst->encoding());
5525
  emit_arith(0x81, 0xC8, dst, imm32);
5526
}
5527

5528
void Assembler::orq(Register dst, Address src) {
5529
  InstructionMark im(this);
5530
  prefixq(src, dst);
5531
  emit_int8(0x0B);
5532
  emit_operand(dst, src);
5533
}
5534

5535
void Assembler::orq(Register dst, Register src) {
5536
  (void) prefixq_and_encode(dst->encoding(), src->encoding());
5537
  emit_arith(0x0B, 0xC0, dst, src);
5538
}
5539

5540
void Assembler::popa() { // 64bit
5541
  movq(r15, Address(rsp, 0));
5542
  movq(r14, Address(rsp, wordSize));
5543
  movq(r13, Address(rsp, 2 * wordSize));
5544
  movq(r12, Address(rsp, 3 * wordSize));
5545
  movq(r11, Address(rsp, 4 * wordSize));
5546
  movq(r10, Address(rsp, 5 * wordSize));
5547
  movq(r9,  Address(rsp, 6 * wordSize));
5548
  movq(r8,  Address(rsp, 7 * wordSize));
5549
  movq(rdi, Address(rsp, 8 * wordSize));
5550
  movq(rsi, Address(rsp, 9 * wordSize));
5551
  movq(rbp, Address(rsp, 10 * wordSize));
5552
  // skip rsp
5553
  movq(rbx, Address(rsp, 12 * wordSize));
5554
  movq(rdx, Address(rsp, 13 * wordSize));
5555
  movq(rcx, Address(rsp, 14 * wordSize));
5556
  movq(rax, Address(rsp, 15 * wordSize));
5557

5558
  addq(rsp, 16 * wordSize);
5559
}
5560

5561
void Assembler::popcntq(Register dst, Address src) {
5562
  assert(VM_Version::supports_popcnt(), "must support");
5563
  InstructionMark im(this);
5564
  emit_int8((unsigned char)0xF3);
5565
  prefixq(src, dst);
5566
  emit_int8((unsigned char)0x0F);
5567
  emit_int8((unsigned char)0xB8);
5568
  emit_operand(dst, src);
5569
}
5570

5571
void Assembler::popcntq(Register dst, Register src) {
5572
  assert(VM_Version::supports_popcnt(), "must support");
5573
  emit_int8((unsigned char)0xF3);
5574
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5575
  emit_int8((unsigned char)0x0F);
5576
  emit_int8((unsigned char)0xB8);
5577
  emit_int8((unsigned char)(0xC0 | encode));
5578
}
5579

5580
void Assembler::popq(Address dst) {
5581
  InstructionMark im(this);
5582
  prefixq(dst);
5583
  emit_int8((unsigned char)0x8F);
5584
  emit_operand(rax, dst);
5585
}
5586

5587
void Assembler::pusha() { // 64bit
5588
  // we have to store original rsp.  ABI says that 128 bytes
5589
  // below rsp are local scratch.
5590
  movq(Address(rsp, -5 * wordSize), rsp);
5591

5592
  subq(rsp, 16 * wordSize);
5593

5594
  movq(Address(rsp, 15 * wordSize), rax);
5595
  movq(Address(rsp, 14 * wordSize), rcx);
5596
  movq(Address(rsp, 13 * wordSize), rdx);
5597
  movq(Address(rsp, 12 * wordSize), rbx);
5598
  // skip rsp
5599
  movq(Address(rsp, 10 * wordSize), rbp);
5600
  movq(Address(rsp, 9 * wordSize), rsi);
5601
  movq(Address(rsp, 8 * wordSize), rdi);
5602
  movq(Address(rsp, 7 * wordSize), r8);
5603
  movq(Address(rsp, 6 * wordSize), r9);
5604
  movq(Address(rsp, 5 * wordSize), r10);
5605
  movq(Address(rsp, 4 * wordSize), r11);
5606
  movq(Address(rsp, 3 * wordSize), r12);
5607
  movq(Address(rsp, 2 * wordSize), r13);
5608
  movq(Address(rsp, wordSize), r14);
5609
  movq(Address(rsp, 0), r15);
5610
}
5611

5612
void Assembler::pushq(Address src) {
5613
  InstructionMark im(this);
5614
  prefixq(src);
5615
  emit_int8((unsigned char)0xFF);
5616
  emit_operand(rsi, src);
5617
}
5618

5619
void Assembler::rclq(Register dst, int imm8) {
5620
  assert(isShiftCount(imm8 >> 1), "illegal shift count");
5621
  int encode = prefixq_and_encode(dst->encoding());
5622
  if (imm8 == 1) {
5623
    emit_int8((unsigned char)0xD1);
5624
    emit_int8((unsigned char)(0xD0 | encode));
5625
  } else {
5626
    emit_int8((unsigned char)0xC1);
5627
    emit_int8((unsigned char)(0xD0 | encode));
5628
    emit_int8(imm8);
5629
  }
5630
}
5631

5632
void Assembler::rcrq(Register dst, int imm8) {
5633
  assert(isShiftCount(imm8 >> 1), "illegal shift count");
5634
  int encode = prefixq_and_encode(dst->encoding());
5635
  if (imm8 == 1) {
5636
    emit_int8((unsigned char)0xD1);
5637
    emit_int8((unsigned char)(0xD8 | encode));
5638
  } else {
5639
    emit_int8((unsigned char)0xC1);
5640
    emit_int8((unsigned char)(0xD8 | encode));
5641
    emit_int8(imm8);
5642
  }
5643
}
5644

5645
void Assembler::rorq(Register dst, int imm8) {
5646
  assert(isShiftCount(imm8 >> 1), "illegal shift count");
5647
  int encode = prefixq_and_encode(dst->encoding());
5648
  if (imm8 == 1) {
5649
    emit_int8((unsigned char)0xD1);
5650
    emit_int8((unsigned char)(0xC8 | encode));
5651
  } else {
5652
    emit_int8((unsigned char)0xC1);
5653
    emit_int8((unsigned char)(0xc8 | encode));
5654
    emit_int8(imm8);
5655
  }
5656
}
5657

5658
void Assembler::rorxq(Register dst, Register src, int imm8) {
5659
  assert(VM_Version::supports_bmi2(), "bit manipulation instructions not supported");
5660
  int encode = vex_prefix_and_encode(dst->encoding(), 0, src->encoding(), VEX_SIMD_F2, VEX_OPCODE_0F_3A, true, false);
5661
  emit_int8((unsigned char)0xF0);
5662
  emit_int8((unsigned char)(0xC0 | encode));
5663
  emit_int8(imm8);
5664
}
5665

5666
void Assembler::sarq(Register dst, int imm8) {
5667
  assert(isShiftCount(imm8 >> 1), "illegal shift count");
5668
  int encode = prefixq_and_encode(dst->encoding());
5669
  if (imm8 == 1) {
5670
    emit_int8((unsigned char)0xD1);
5671
    emit_int8((unsigned char)(0xF8 | encode));
5672
  } else {
5673
    emit_int8((unsigned char)0xC1);
5674
    emit_int8((unsigned char)(0xF8 | encode));
5675
    emit_int8(imm8);
5676
  }
5677
}
5678

5679
void Assembler::sarq(Register dst) {
5680
  int encode = prefixq_and_encode(dst->encoding());
5681
  emit_int8((unsigned char)0xD3);
5682
  emit_int8((unsigned char)(0xF8 | encode));
5683
}
5684

5685
void Assembler::sbbq(Address dst, int32_t imm32) {
5686
  InstructionMark im(this);
5687
  prefixq(dst);
5688
  emit_arith_operand(0x81, rbx, dst, imm32);
5689
}
5690

5691
void Assembler::sbbq(Register dst, int32_t imm32) {
5692
  (void) prefixq_and_encode(dst->encoding());
5693
  emit_arith(0x81, 0xD8, dst, imm32);
5694
}
5695

5696
void Assembler::sbbq(Register dst, Address src) {
5697
  InstructionMark im(this);
5698
  prefixq(src, dst);
5699
  emit_int8(0x1B);
5700
  emit_operand(dst, src);
5701
}
5702

5703
void Assembler::sbbq(Register dst, Register src) {
5704
  (void) prefixq_and_encode(dst->encoding(), src->encoding());
5705
  emit_arith(0x1B, 0xC0, dst, src);
5706
}
5707

5708
void Assembler::shlq(Register dst, int imm8) {
5709
  assert(isShiftCount(imm8 >> 1), "illegal shift count");
5710
  int encode = prefixq_and_encode(dst->encoding());
5711
  if (imm8 == 1) {
5712
    emit_int8((unsigned char)0xD1);
5713
    emit_int8((unsigned char)(0xE0 | encode));
5714
  } else {
5715
    emit_int8((unsigned char)0xC1);
5716
    emit_int8((unsigned char)(0xE0 | encode));
5717
    emit_int8(imm8);
5718
  }
5719
}
5720

5721
void Assembler::shlq(Register dst) {
5722
  int encode = prefixq_and_encode(dst->encoding());
5723
  emit_int8((unsigned char)0xD3);
5724
  emit_int8((unsigned char)(0xE0 | encode));
5725
}
5726

5727
void Assembler::shrq(Register dst, int imm8) {
5728
  assert(isShiftCount(imm8 >> 1), "illegal shift count");
5729
  int encode = prefixq_and_encode(dst->encoding());
5730
  emit_int8((unsigned char)0xC1);
5731
  emit_int8((unsigned char)(0xE8 | encode));
5732
  emit_int8(imm8);
5733
}
5734

5735
void Assembler::shrq(Register dst) {
5736
  int encode = prefixq_and_encode(dst->encoding());
5737
  emit_int8((unsigned char)0xD3);
5738
  emit_int8(0xE8 | encode);
5739
}
5740

5741
void Assembler::subq(Address dst, int32_t imm32) {
5742
  InstructionMark im(this);
5743
  prefixq(dst);
5744
  emit_arith_operand(0x81, rbp, dst, imm32);
5745
}
5746

5747
void Assembler::subq(Address dst, Register src) {
5748
  InstructionMark im(this);
5749
  prefixq(dst, src);
5750
  emit_int8(0x29);
5751
  emit_operand(src, dst);
5752
}
5753

5754
void Assembler::subq(Register dst, int32_t imm32) {
5755
  (void) prefixq_and_encode(dst->encoding());
5756
  emit_arith(0x81, 0xE8, dst, imm32);
5757
}
5758

5759
// Force generation of a 4 byte immediate value even if it fits into 8bit
5760
void Assembler::subq_imm32(Register dst, int32_t imm32) {
5761
  (void) prefixq_and_encode(dst->encoding());
5762
  emit_arith_imm32(0x81, 0xE8, dst, imm32);
5763
}
5764

5765
void Assembler::subq(Register dst, Address src) {
5766
  InstructionMark im(this);
5767
  prefixq(src, dst);
5768
  emit_int8(0x2B);
5769
  emit_operand(dst, src);
5770
}
5771

5772
void Assembler::subq(Register dst, Register src) {
5773
  (void) prefixq_and_encode(dst->encoding(), src->encoding());
5774
  emit_arith(0x2B, 0xC0, dst, src);
5775
}
5776

5777
void Assembler::testq(Register dst, int32_t imm32) {
5778
  // not using emit_arith because test
5779
  // doesn't support sign-extension of
5780
  // 8bit operands
5781
  int encode = dst->encoding();
5782
  if (encode == 0) {
5783
    prefix(REX_W);
5784
    emit_int8((unsigned char)0xA9);
5785
  } else {
5786
    encode = prefixq_and_encode(encode);
5787
    emit_int8((unsigned char)0xF7);
5788
    emit_int8((unsigned char)(0xC0 | encode));
5789
  }
5790
  emit_int32(imm32);
5791
}
5792

5793
void Assembler::testq(Register dst, Register src) {
5794
  (void) prefixq_and_encode(dst->encoding(), src->encoding());
5795
  emit_arith(0x85, 0xC0, dst, src);
5796
}
5797

5798
void Assembler::xaddq(Address dst, Register src) {
5799
  InstructionMark im(this);
5800
  prefixq(dst, src);
5801
  emit_int8(0x0F);
5802
  emit_int8((unsigned char)0xC1);
5803
  emit_operand(src, dst);
5804
}
5805

5806
void Assembler::xchgq(Register dst, Address src) {
5807
  InstructionMark im(this);
5808
  prefixq(src, dst);
5809
  emit_int8((unsigned char)0x87);
5810
  emit_operand(dst, src);
5811
}
5812

5813
void Assembler::xchgq(Register dst, Register src) {
5814
  int encode = prefixq_and_encode(dst->encoding(), src->encoding());
5815
  emit_int8((unsigned char)0x87);
5816
  emit_int8((unsigned char)(0xc0 | encode));
5817
}
5818

5819
void Assembler::xorq(Register dst, Register src) {
5820
  (void) prefixq_and_encode(dst->encoding(), src->encoding());
5821
  emit_arith(0x33, 0xC0, dst, src);
5822
}
5823

5824
void Assembler::xorq(Register dst, Address src) {
5825
  InstructionMark im(this);
5826
  prefixq(src, dst);
5827
  emit_int8(0x33);
5828
  emit_operand(dst, src);
5829
}
5830

5831
#endif // !LP64
5832

5833
Product

Resources

Company