src/hotspot/cpu/ppc/macroAssembler_ppc.cpp
author coleenp
Tue, 03 Oct 2017 16:42:04 -0400
changeset 47580 96392e113a0a
parent 47521 122833427b36
child 48332 651a95f30dfb
permissions -rw-r--r--
8186777: Make Klass::_java_mirror an OopHandle Summary: Add indirection for fetching mirror so that GC doesn't have to follow CLD::_klasses Reviewed-by: hseigel, thartmann, eosterlund, stefank Contributed-by: coleen.phillimore@oracle.com, rickard.backman@oracle.com
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
     1
/*
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
     2
 * Copyright (c) 1997, 2017, Oracle and/or its affiliates. All rights reserved.
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
     3
 * Copyright (c) 2012, 2017, SAP SE. All rights reserved.
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
     4
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
     5
 *
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
     6
 * This code is free software; you can redistribute it and/or modify it
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
     7
 * under the terms of the GNU General Public License version 2 only, as
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
     8
 * published by the Free Software Foundation.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
     9
 *
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    10
 * This code is distributed in the hope that it will be useful, but WITHOUT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    11
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    12
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    13
 * version 2 for more details (a copy is included in the LICENSE file that
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    14
 * accompanied this code).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    15
 *
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    16
 * You should have received a copy of the GNU General Public License version
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    17
 * 2 along with this work; if not, write to the Free Software Foundation,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    18
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    19
 *
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    20
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    21
 * or visit www.oracle.com if you need additional information or have any
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    22
 * questions.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    23
 *
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    24
 */
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    25
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    26
#include "precompiled.hpp"
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    27
#include "asm/macroAssembler.inline.hpp"
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    28
#include "compiler/disassembler.hpp"
30764
fec48bf5a827 8079792: GC directory structure cleanup
pliden
parents: 30303
diff changeset
    29
#include "gc/shared/cardTableModRefBS.hpp"
fec48bf5a827 8079792: GC directory structure cleanup
pliden
parents: 30303
diff changeset
    30
#include "gc/shared/collectedHeap.inline.hpp"
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    31
#include "interpreter/interpreter.hpp"
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    32
#include "memory/resourceArea.hpp"
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
    33
#include "nativeInst_ppc.hpp"
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    34
#include "prims/methodHandles.hpp"
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    35
#include "runtime/biasedLocking.hpp"
25715
d5a8dbdc5150 8049325: Introduce and clean up umbrella headers for the files in the cpu subdirectories.
goetz
parents: 25374
diff changeset
    36
#include "runtime/icache.hpp"
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    37
#include "runtime/interfaceSupport.hpp"
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    38
#include "runtime/objectMonitor.hpp"
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    39
#include "runtime/os.hpp"
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    40
#include "runtime/sharedRuntime.hpp"
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    41
#include "runtime/stubRoutines.hpp"
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    42
#include "utilities/macros.hpp"
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    43
#if INCLUDE_ALL_GCS
30764
fec48bf5a827 8079792: GC directory structure cleanup
pliden
parents: 30303
diff changeset
    44
#include "gc/g1/g1CollectedHeap.inline.hpp"
fec48bf5a827 8079792: GC directory structure cleanup
pliden
parents: 30303
diff changeset
    45
#include "gc/g1/g1SATBCardTableModRefBS.hpp"
fec48bf5a827 8079792: GC directory structure cleanup
pliden
parents: 30303
diff changeset
    46
#include "gc/g1/heapRegion.hpp"
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    47
#endif // INCLUDE_ALL_GCS
36303
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
    48
#ifdef COMPILER2
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
    49
#include "opto/intrinsicnode.hpp"
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
    50
#endif
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    51
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    52
// BLOCK_COMMENT(str): forwards to block_comment(str) in non-PRODUCT builds and
// expands to nothing in PRODUCT builds.
#ifndef PRODUCT
#define BLOCK_COMMENT(str) block_comment(str)
#else
#define BLOCK_COMMENT(str) // nothing
#endif

// BIND(label): binds the label, then hands the stringified label name followed
// by ':' to BLOCK_COMMENT.
// NOTE: this expands to two statements, so do not use it as the sole body of an
// unbraced if/else/loop.
#define BIND(label) bind(label); BLOCK_COMMENT(#label ":")
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    58
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    59
#ifdef ASSERT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    60
// On RISC, there's no benefit to verifying instruction boundaries.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    61
bool AbstractAssembler::pd_check_instruction_mark() { return false; }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    62
#endif
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    63
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    64
// Emit a doubleword load of the memory at (a + si31) into d.
//
//   d               - register receiving the loaded value; in the large-offset
//                     case it also holds the intermediate address.
//   si31            - non-negative offset that must fit into 31 bits (asserted).
//   a               - base register.
//   emit_filler_nop - if non-zero, a nop is appended to the single-instruction
//                     form, so both forms consist of two instructions.
//
// Unlike ld_largeoffset(), this variant does not check that d and a differ.
void MacroAssembler::ld_largeoffset_unchecked(Register d, int si31, Register a, int emit_filler_nop) {
  assert(Assembler::is_simm(si31, 31) && si31 >= 0, "si31 out of range");

  if (!Assembler::is_simm(si31, 16)) {
    // The offset does not fit into a 16-bit immediate: add the high part to
    // the base first, then load using the low part as displacement.
    const int upper = MacroAssembler::largeoffset_si16_si16_hi(si31);
    const int lower = MacroAssembler::largeoffset_si16_si16_lo(si31);
    addis(d, a, upper);
    ld(d, lower, d);
    return;
  }

  // Small offset: a single load is sufficient.
  ld(d, si31, a);
  if (emit_filler_nop) {
    nop();
  }
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    76
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    77
// Checked flavor of ld_largeoffset_unchecked(): emits a doubleword load of the
// memory at (a + si31) into d, after asserting that d and a are different
// registers. All arguments are passed through unchanged.
void MacroAssembler::ld_largeoffset(Register d, int si31, Register a, int emit_filler_nop) {
  // The destination must not alias the base register.
  assert_different_registers(d, a);

  ld_largeoffset_unchecked(d, si31, a, emit_filler_nop);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    81
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    82
void MacroAssembler::load_sized_value(Register dst, RegisterOrConstant offs, Register base,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    83
                                      size_t size_in_bytes, bool is_signed) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    84
  switch (size_in_bytes) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    85
  case  8:              ld(dst, offs, base);                         break;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    86
  case  4:  is_signed ? lwa(dst, offs, base) : lwz(dst, offs, base); break;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    87
  case  2:  is_signed ? lha(dst, offs, base) : lhz(dst, offs, base); break;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    88
  case  1:  lbz(dst, offs, base); if (is_signed) extsb(dst, dst);    break; // lba doesn't exist :(
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    89
  default:  ShouldNotReachHere();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    90
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    91
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    92
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    93
void MacroAssembler::store_sized_value(Register dst, RegisterOrConstant offs, Register base,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    94
                                       size_t size_in_bytes) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    95
  switch (size_in_bytes) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    96
  case  8:  std(dst, offs, base); break;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    97
  case  4:  stw(dst, offs, base); break;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    98
  case  2:  sth(dst, offs, base); break;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
    99
  case  1:  stb(dst, offs, base); break;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   100
  default:  ShouldNotReachHere();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   101
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   102
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   103
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   104
void MacroAssembler::align(int modulus, int max, int rem) {
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   105
  int padding = (rem + modulus - (offset() % modulus)) % modulus;
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   106
  if (padding > max) return;
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   107
  for (int c = (padding >> 2); c > 0; --c) { nop(); }
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   108
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   109
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   110
// Issue instructions that calculate given TOC from global TOC.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   111
void MacroAssembler::calculate_address_from_global_toc(Register dst, address addr, bool hi16, bool lo16,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   112
                                                       bool add_relocation, bool emit_dummy_addr) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   113
  int offset = -1;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   114
  if (emit_dummy_addr) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   115
    offset = -128; // dummy address
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   116
  } else if (addr != (address)(intptr_t)-1) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   117
    offset = MacroAssembler::offset_to_global_toc(addr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   118
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   119
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   120
  if (hi16) {
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   121
    addis(dst, R29_TOC, MacroAssembler::largeoffset_si16_si16_hi(offset));
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   122
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   123
  if (lo16) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   124
    if (add_relocation) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   125
      // Relocate at the addi to avoid confusion with a load from the method's TOC.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   126
      relocate(internal_word_Relocation::spec(addr));
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   127
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   128
    addi(dst, dst, MacroAssembler::largeoffset_si16_si16_lo(offset));
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   129
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   130
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   131
47520
50790528dd25 8187547: PPC64: icache invalidation is incorrect in some places
goetz
parents: 47216
diff changeset
   132
// Patch an addis/addi pair that computes an address from the global TOC so
// that it yields addr.
//
//   a     - address of the addi (the second instruction of the pair).
//   bound - lowest address inspected while searching backwards for the addis.
//   addr  - new target address.
//
// Returns the address of the addis, i.e. the start of the patched sequence
// (presumably so that the caller can flush the instruction cache from there;
// confirm against the callers).
address MacroAssembler::patch_calculate_address_from_global_toc_at(address a, address bound, address addr) {
  const int offset = MacroAssembler::offset_to_global_toc(addr);

  // The relocation points to the second instruction, the addi,
  // and the addi reads and writes the same register dst.
  const address addi_addr = a;
  const int inst2 = *(int *)addi_addr;
  const int dst = inv_rt_field(inst2);
  assert(is_addi(inst2) && inv_ra_field(inst2) == dst, "must be addi reading and writing dst");

  // Walk backwards, one instruction at a time, to the addis which writes dst.
  // The walk ends at the first match or once it has passed bound.
  int inst1 = 0;
  address addis_addr = addi_addr - BytesPerInstWord;
  for (; addis_addr >= bound; addis_addr -= BytesPerInstWord) {
    inst1 = *(int *) addis_addr;
    if (is_addis(inst1) && inv_rt_field(inst1) == dst) {
      break; // found it
    }
  }

  assert(is_addis(inst1) && inv_ra_field(inst1) == 29 /* R29 */, "source must be global TOC");

  // Rewrite the immediates of both instructions with the new offset parts.
  set_imm((int *)addis_addr, MacroAssembler::largeoffset_si16_si16_hi(offset));
  set_imm((int *)addi_addr,  MacroAssembler::largeoffset_si16_si16_lo(offset));
  return addis_addr;
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   160
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   161
// Decode the address computed by an addis/addi pair relative to the global TOC.
//
//   a     - address of the addi (the second instruction of the pair).
//   bound - lowest address inspected while searching backwards for the addis.
//
// Returns global_toc() plus the encoded offset, or (address)-1 if the encoded
// offset is the special value -1.
address MacroAssembler::get_address_of_calculate_address_from_global_toc_at(address a, address bound) {
  // The relocation points to the second instruction, the addi,
  // and the addi reads and writes the same register dst.
  const address addi_addr = a;
  const int inst2 = *(int *)addi_addr;
  const int dst = inv_rt_field(inst2);
  assert(is_addi(inst2) && inv_ra_field(inst2) == dst, "must be addi reading and writing dst");

  // Walk backwards, one instruction at a time, to the addis which writes dst.
  // The walk ends at the first match or once it has passed bound.
  int inst1 = 0;
  address addis_addr = addi_addr - BytesPerInstWord;
  for (; addis_addr >= bound; addis_addr -= BytesPerInstWord) {
    inst1 = *(int *) addis_addr;
    if (is_addis(inst1) && inv_rt_field(inst1) == dst) {
      break; // found it
    }
  }

  assert(is_addis(inst1) && inv_ra_field(inst1) == 29 /* R29 */, "source must be global TOC");

  // Recombine the high (addis) and low (addi) immediates into the offset.
  const int toc_offset = (get_imm(addis_addr, 0) << 16) + get_imm(addi_addr, 0);

  // -1 is a special case
  if (toc_offset == -1) {
    return (address)(intptr_t)-1;
  }
  return global_toc() + toc_offset;
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   192
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   193
#ifdef _LP64
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   194
// Patch compressed oops or klass constants.
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   195
// Assembler sequence is
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   196
// 1) compressed oops:
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   197
//    lis  rx = const.hi
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   198
//    ori rx = rx | const.lo
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   199
// 2) compressed klass:
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   200
//    lis  rx = const.hi
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   201
//    clrldi rx = rx & 0xFFFFffff // clearMS32b, optional
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   202
//    ori rx = rx | const.lo
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   203
// Clrldi will be passed by.
47520
50790528dd25 8187547: PPC64: icache invalidation is incorrect in some places
goetz
parents: 47216
diff changeset
   204
address MacroAssembler::patch_set_narrow_oop(address a, address bound, narrowOop data) {
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   205
  assert(UseCompressedOops, "Should only patch compressed oops");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   206
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   207
  const address inst2_addr = a;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   208
  const int inst2 = *(int *)inst2_addr;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   209
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   210
  // The relocation points to the second instruction, the ori,
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   211
  // and the ori reads and writes the same register dst.
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   212
  const int dst = inv_rta_field(inst2);
22867
309bcf262a19 8031319: PPC64: Some fixes in ppc and aix coding.
goetz
parents: 22861
diff changeset
   213
  assert(is_ori(inst2) && inv_rs_field(inst2) == dst, "must be ori reading and writing dst");
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   214
  // Now, find the preceding addis which writes to dst.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   215
  int inst1 = 0;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   216
  address inst1_addr = inst2_addr - BytesPerInstWord;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   217
  bool inst1_found = false;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   218
  while (inst1_addr >= bound) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   219
    inst1 = *(int *)inst1_addr;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   220
    if (is_lis(inst1) && inv_rs_field(inst1) == dst) { inst1_found = true; break; }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   221
    inst1_addr -= BytesPerInstWord;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   222
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   223
  assert(inst1_found, "inst is not lis");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   224
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   225
  int xc = (data >> 16) & 0xffff;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   226
  int xd = (data >>  0) & 0xffff;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   227
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   228
  set_imm((int *)inst1_addr, (short)(xc)); // see enc_load_con_narrow_hi/_lo
22867
309bcf262a19 8031319: PPC64: Some fixes in ppc and aix coding.
goetz
parents: 22861
diff changeset
   229
  set_imm((int *)inst2_addr,        (xd)); // unsigned int
47520
50790528dd25 8187547: PPC64: icache invalidation is incorrect in some places
goetz
parents: 47216
diff changeset
   230
  return inst1_addr;
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   231
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   232
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   233
// Get compressed oop or klass constant.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   234
narrowOop MacroAssembler::get_narrow_oop(address a, address bound) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   235
  assert(UseCompressedOops, "Should only patch compressed oops");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   236
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   237
  const address inst2_addr = a;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   238
  const int inst2 = *(int *)inst2_addr;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   239
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   240
  // The relocation points to the second instruction, the ori,
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   241
  // and the ori reads and writes the same register dst.
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   242
  const int dst = inv_rta_field(inst2);
22867
309bcf262a19 8031319: PPC64: Some fixes in ppc and aix coding.
goetz
parents: 22861
diff changeset
   243
  assert(is_ori(inst2) && inv_rs_field(inst2) == dst, "must be ori reading and writing dst");
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   244
  // Now, find the preceding lis which writes to dst.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   245
  int inst1 = 0;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   246
  address inst1_addr = inst2_addr - BytesPerInstWord;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   247
  bool inst1_found = false;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   248
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   249
  while (inst1_addr >= bound) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   250
    inst1 = *(int *) inst1_addr;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   251
    if (is_lis(inst1) && inv_rs_field(inst1) == dst) { inst1_found = true; break;}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   252
    inst1_addr -= BytesPerInstWord;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   253
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   254
  assert(inst1_found, "inst is not lis");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   255
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   256
  uint xl = ((unsigned int) (get_imm(inst2_addr, 0) & 0xffff));
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   257
  uint xh = (((get_imm(inst1_addr, 0)) & 0xffff) << 16);
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   258
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   259
  return (int) (xl | xh);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   260
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   261
#endif // _LP64
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   262
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   263
// Returns true if successful.
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   264
bool MacroAssembler::load_const_from_method_toc(Register dst, AddressLiteral& a,
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   265
                                                Register toc, bool fixed_size) {
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   266
  int toc_offset = 0;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   267
  // Use RelocationHolder::none for the constant pool entry, otherwise
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   268
  // we will end up with a failing NativeCall::verify(x) where x is
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   269
  // the address of the constant pool entry.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   270
  // FIXME: We should insert relocation information for oops at the constant
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   271
  // pool entries instead of inserting it at the loads; patching of a constant
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   272
  // pool entry should be less expensive.
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   273
  address const_address = address_constant((address)a.value(), RelocationHolder::none);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   274
  if (const_address == NULL) { return false; } // allocation failure
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   275
  // Relocate at the pc of the load.
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   276
  relocate(a.rspec());
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   277
  toc_offset = (int)(const_address - code()->consts()->start());
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   278
  ld_largeoffset_unchecked(dst, toc_offset, toc, fixed_size);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   279
  return true;
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   280
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   281
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   282
// Check whether the instruction at a can be the start of a
// load_const_from_method_toc sequence.
//
// The relocation points to the ld or the addis, so the instruction is
// accepted if it is an ld, or an addis whose ra field is not 0.
bool MacroAssembler::is_load_const_from_method_toc_at(address a) {
  const int inst = *(int *)a;

  if (is_ld(inst)) {
    return true;
  }
  return is_addis(inst) && inv_ra_field(inst) != 0;
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   290
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   291
// Return the displacement encoded in the load_const_from_method_toc
// sequence at a.
//
// Short form: a single ld; its d1 field is the result.
// Long form:  an addis followed (not necessarily immediately) by an ld
//             that reads and writes the addis' target register; the
//             result is (addis.d1 << 16) + ld.d1.
// The forward search for the ld has no upper bound.
int MacroAssembler::get_offset_of_load_const_from_method_toc_at(address a) {
  assert(is_load_const_from_method_toc_at(a), "must be load_const_from_method_toc");

  const int first = *(int *)a;

  if (is_ld(first)) {
    return inv_d1_field(first);
  }

  if (!is_addis(first)) {
    ShouldNotReachHere();
    return 0;
  }

  const int dst = inv_rt_field(first);

  // Now, find the succeeding ld which reads and writes to dst.
  address ld_pc = a + BytesPerInstWord;
  int ld_inst = *(int *) ld_pc;
  while (!(is_ld(ld_inst) && inv_ra_field(ld_inst) == dst && inv_rt_field(ld_inst) == dst)) {
    ld_pc += BytesPerInstWord;
    ld_inst = *(int *) ld_pc;
  }

  return (inv_d1_field(first) << 16) + inv_d1_field(ld_inst);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   318
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   319
// Get the constant from a `load_const' sequence.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   320
long MacroAssembler::get_const(address a) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   321
  assert(is_load_const_at(a), "not a load of a constant");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   322
  const int *p = (const int*) a;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   323
  unsigned long x = (((unsigned long) (get_imm(a,0) & 0xffff)) << 48);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   324
  if (is_ori(*(p+1))) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   325
    x |= (((unsigned long) (get_imm(a,1) & 0xffff)) << 32);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   326
    x |= (((unsigned long) (get_imm(a,3) & 0xffff)) << 16);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   327
    x |= (((unsigned long) (get_imm(a,4) & 0xffff)));
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   328
  } else if (is_lis(*(p+1))) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   329
    x |= (((unsigned long) (get_imm(a,2) & 0xffff)) << 32);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   330
    x |= (((unsigned long) (get_imm(a,1) & 0xffff)) << 16);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   331
    x |= (((unsigned long) (get_imm(a,3) & 0xffff)));
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   332
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   333
    ShouldNotReachHere();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   334
    return (long) 0;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   335
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   336
  return (long) x;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   337
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   338
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   339
// Patch the 64 bit constant of a `load_const' sequence. This is a low
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   340
// level procedure. It neither flushes the instruction cache nor is it
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   341
// mt safe.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   342
void MacroAssembler::patch_const(address a, long x) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   343
  assert(is_load_const_at(a), "not a load of a constant");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   344
  int *p = (int*) a;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   345
  if (is_ori(*(p+1))) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   346
    set_imm(0 + p, (x >> 48) & 0xffff);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   347
    set_imm(1 + p, (x >> 32) & 0xffff);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   348
    set_imm(3 + p, (x >> 16) & 0xffff);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   349
    set_imm(4 + p, x & 0xffff);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   350
  } else if (is_lis(*(p+1))) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   351
    set_imm(0 + p, (x >> 48) & 0xffff);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   352
    set_imm(2 + p, (x >> 32) & 0xffff);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   353
    set_imm(1 + p, (x >> 16) & 0xffff);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   354
    set_imm(3 + p, x & 0xffff);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   355
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   356
    ShouldNotReachHere();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   357
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   358
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   359
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   360
// Build an AddressLiteral for obj whose relocation spec is a
// metadata_Relocation for the index obtained from
// oop_recorder()->allocate_metadata_index(obj).
// Requires an oop recorder to be installed in this assembler.
AddressLiteral MacroAssembler::allocate_metadata_address(Metadata* obj) {
  assert(oop_recorder() != NULL, "this assembler needs a Recorder");
  const int md_index = oop_recorder()->allocate_metadata_index(obj);
  return AddressLiteral((address)obj, metadata_Relocation::spec(md_index));
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   366
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   367
// Build an AddressLiteral for obj whose relocation spec is a
// metadata_Relocation for the index obtained from
// oop_recorder()->find_index(obj).
// Requires an oop recorder to be installed in this assembler.
AddressLiteral MacroAssembler::constant_metadata_address(Metadata* obj) {
  assert(oop_recorder() != NULL, "this assembler needs a Recorder");
  const int md_index = oop_recorder()->find_index(obj);
  return AddressLiteral((address)obj, metadata_Relocation::spec(md_index));
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   373
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   374
// Build an AddressLiteral for obj whose relocation spec is an
// oop_Relocation for the index obtained from
// oop_recorder()->allocate_oop_index(obj).
// Requires an oop recorder to be installed in this assembler.
AddressLiteral MacroAssembler::allocate_oop_address(jobject obj) {
  assert(oop_recorder() != NULL, "this assembler needs an OopRecorder");
  const int index = oop_recorder()->allocate_oop_index(obj);
  RelocationHolder rspec = oop_Relocation::spec(index);
  return AddressLiteral(address(obj), rspec);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   379
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   380
// Build an AddressLiteral for obj whose relocation spec is an
// oop_Relocation for the index obtained from
// oop_recorder()->find_index(obj).
// Requires an oop recorder to be installed in this assembler.
AddressLiteral MacroAssembler::constant_oop_address(jobject obj) {
  assert(oop_recorder() != NULL, "this assembler needs an OopRecorder");
  const int index = oop_recorder()->find_index(obj);
  RelocationHolder rspec = oop_Relocation::spec(index);
  return AddressLiteral(address(obj), rspec);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   385
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   386
// Produce `*delayed_value_addr + offset' either as a constant or in tmp.
//
// If the word at delayed_value_addr is already non-zero at code
// generation time, the sum is returned as a constant and no code is
// emitted. Otherwise code is emitted that loads the word from
// delayed_value_addr into tmp and, for a non-zero offset, adds offset;
// tmp is returned in that case.
//
// delayed_value_addr - location of the (possibly not yet set) value.
// tmp                - register used for the emitted load.
// offset             - addend applied to the value.
RegisterOrConstant MacroAssembler::delayed_value_impl(intptr_t* delayed_value_addr,
                                                      Register tmp, int offset) {
  const intptr_t current = *delayed_value_addr;

  if (current == 0) {
    // Load indirectly to solve generation ordering problem.
    // static address, no relocation
    // The value returned by load_const_optimized is used as the
    // displacement of the following ld.
    const int disp = load_const_optimized(tmp, delayed_value_addr, noreg, true);
    ld(tmp, disp, tmp); // must be aligned ((xa & 3) == 0)

    if (offset != 0) {
      addi(tmp, tmp, offset);
    }
    return RegisterOrConstant(tmp);
  }

  return RegisterOrConstant(current + offset);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   404
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   405
#ifndef PRODUCT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   406
// Print the patched instruction at branch.
// Not implemented for this platform; calling it hits Unimplemented().
void MacroAssembler::pd_print_patched_instruction(address branch) {
  // TODO: PPC port
  Unimplemented();
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   409
#endif // ndef PRODUCT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   410
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   411
// Conditional far branch for destinations encodable in 24+2 bits.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   412
void MacroAssembler::bc_far(int boint, int biint, Label& dest, int optimize) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   413
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   414
  // If requested by flag optimize, relocate the bc_far as a
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   415
  // runtime_call and prepare for optimizing it when the code gets
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   416
  // relocated.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   417
  if (optimize == bc_far_optimize_on_relocate) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   418
    relocate(relocInfo::runtime_call_type);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   419
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   420
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   421
  // variant 2:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   422
  //
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   423
  //    b!cxx SKIP
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   424
  //    bxx   DEST
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   425
  //  SKIP:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   426
  //
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   427
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   428
  const int opposite_boint = add_bhint_to_boint(opposite_bhint(inv_boint_bhint(boint)),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   429
                                                opposite_bcond(inv_boint_bcond(boint)));
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   430
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   431
  // We emit two branches.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   432
  // First, a conditional branch which jumps around the far branch.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   433
  const address not_taken_pc = pc() + 2 * BytesPerInstWord;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   434
  const address bc_pc        = pc();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   435
  bc(opposite_boint, biint, not_taken_pc);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   436
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   437
  const int bc_instr = *(int*)bc_pc;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   438
  assert(not_taken_pc == (address)inv_bd_field(bc_instr, (intptr_t)bc_pc), "postcondition");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   439
  assert(opposite_boint == inv_bo_field(bc_instr), "postcondition");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   440
  assert(boint == add_bhint_to_boint(opposite_bhint(inv_boint_bhint(inv_bo_field(bc_instr))),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   441
                                     opposite_bcond(inv_boint_bcond(inv_bo_field(bc_instr)))),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   442
         "postcondition");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   443
  assert(biint == inv_bi_field(bc_instr), "postcondition");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   444
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   445
  // Second, an unconditional far branch which jumps to dest.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   446
  // Note: target(dest) remembers the current pc (see CodeSection::target)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   447
  //       and returns the current pc if the label is not bound yet; when
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   448
  //       the label gets bound, the unconditional far branch will be patched.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   449
  const address target_pc = target(dest);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   450
  const address b_pc  = pc();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   451
  b(target_pc);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   452
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   453
  assert(not_taken_pc == pc(),                     "postcondition");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   454
  assert(dest.is_bound() || target_pc == b_pc, "postcondition");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   455
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   456
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   457
// 1 or 2 instructions
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   458
void MacroAssembler::bc_far_optimized(int boint, int biint, Label& dest) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   459
  if (dest.is_bound() && is_within_range_of_bcxx(target(dest), pc())) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   460
    bc(boint, biint, dest);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   461
  } else {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   462
    bc_far(boint, biint, dest, MacroAssembler::bc_far_optimize_on_relocate);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   463
  }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   464
}
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   465
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   466
// Returns true if the code at 'instruction_addr' matches any of the three
// bc_far variants (checked in the order 1, 2, 3).
bool MacroAssembler::is_bc_far_at(address instruction_addr) {
  if (is_bc_far_variant1_at(instruction_addr)) {
    return true;
  }
  if (is_bc_far_variant2_at(instruction_addr)) {
    return true;
  }
  return is_bc_far_variant3_at(instruction_addr);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   471
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   472
// Returns the branch destination of the bc_far sequence at 'instruction_addr'.
//
//   variant 1: decoded from the first instruction.
//   variant 2: the destination of the branch in the second instruction.
//   variant 3: the address right behind the two-instruction sequence.
//
// Any other code pattern ends in ShouldNotReachHere().
address MacroAssembler::get_dest_of_bc_far_at(address instruction_addr) {
  if (is_bc_far_variant1_at(instruction_addr)) {
    const int first_instr = *(int*)instruction_addr;
    return (address)inv_bd_field(first_instr, (intptr_t)instruction_addr);
  }

  if (is_bc_far_variant2_at(instruction_addr)) {
    const address second_instr_addr = instruction_addr + 4;
    return bxx_destination(second_instr_addr);
  }

  if (is_bc_far_variant3_at(instruction_addr)) {
    return instruction_addr + 8;
  }

  // variant 4 ???
  ShouldNotReachHere();
  return NULL;
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   487
// Re-point the bc_far sequence at 'instruction_addr' to 'dest'.
//
// The two instruction words are re-emitted in place through a temporary
// MacroAssembler and the instruction cache is flushed for them afterwards.
// A sequence that is already variant 3 is left untouched.
void MacroAssembler::set_dest_of_bc_far_at(address instruction_addr, address dest) {
  // variant 3, far cond branch to the next instruction, already patched to nops:
  //
  //    nop
  //    endgroup
  //  SKIP/DEST:
  //
  if (is_bc_far_variant3_at(instruction_addr)) {
    return;
  }

  // Assembler that writes directly over the existing two instructions.
  ResourceMark rm;
  const int code_size = 2 * BytesPerInstWord;
  CodeBuffer patch_buf(instruction_addr, code_size);
  MacroAssembler patcher(&patch_buf);

  const bool branches_to_next_instr =
      is_bc_far_variant2_at(instruction_addr) && dest == instruction_addr + 8;

  if (branches_to_next_instr) {
    // Far branch to next instruction: Optimize it by patching nops (produce variant 3).
    patcher.nop();
    patcher.endgroup();
  } else {
    // first, extract boint and biint from the current branch
    int boint = 0;
    int biint = 0;

    if (is_bc_far_variant1_at(instruction_addr)) {
      // variant 1, the 1st instruction contains the destination address:
      //
      //    bcxx  DEST
      //    nop
      //
      const int first_instr = *(int*)(instruction_addr);
      boint = inv_bo_field(first_instr);
      biint = inv_bi_field(first_instr);
    } else if (is_bc_far_variant2_at(instruction_addr)) {
      // variant 2, the 2nd instruction contains the destination address:
      //
      //    b!cxx SKIP
      //    bxx   DEST
      //  SKIP:
      //
      // The first instruction carries the negated condition, so flip hint
      // and condition back to obtain the original BO.
      const int first_instr = *(int*)(instruction_addr);
      const int stored_bo   = inv_bo_field(first_instr);
      boint = add_bhint_to_boint(opposite_bhint(inv_boint_bhint(stored_bo)),
                                 opposite_bcond(inv_boint_bcond(stored_bo)));
      biint = inv_bi_field(first_instr);
    } else {
      // variant 4???
      ShouldNotReachHere();
    }

    // second, set the new branch destination and optimize the code
    const bool still_unbound = (dest == instruction_addr + 4); // the bc_far is still unbound!
    if (!still_unbound && patcher.is_within_range_of_bcxx(dest, instruction_addr)) {
      // variant 1:
      //
      //    bcxx  DEST
      //    nop
      //
      patcher.bc(boint, biint, dest);
      patcher.nop();
    } else {
      // variant 2:
      //
      //    b!cxx SKIP
      //    bxx   DEST
      //  SKIP:
      //
      const int flipped_hint  = opposite_bhint(inv_boint_bhint(boint));
      const int flipped_cond  = opposite_bcond(inv_boint_bcond(boint));
      const int negated_boint = add_bhint_to_boint(flipped_hint, flipped_cond);
      const address skip_pc   = patcher.pc() + 2 * BytesPerInstWord;
      patcher.bc(negated_boint, biint, skip_pc);
      patcher.b(dest);
    }
  }

  // Flush the instruction cache for the rewritten words.
  ICache::ppc64_flush_icache_bytes(instruction_addr, code_size);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   563
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   564
// Emit a NOT mt-safe patchable 64 bit absolute call/jump.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   565
void MacroAssembler::bxx64_patchable(address dest, relocInfo::relocType rt, bool link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   566
  // get current pc
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   567
  uint64_t start_pc = (uint64_t) pc();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   568
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   569
  const address pc_of_bl = (address) (start_pc + (6*BytesPerInstWord)); // bl is last
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   570
  const address pc_of_b  = (address) (start_pc + (0*BytesPerInstWord)); // b is first
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   571
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   572
  // relocate here
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   573
  if (rt != relocInfo::none) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   574
    relocate(rt);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   575
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   576
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   577
  if ( ReoptimizeCallSequences &&
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   578
       (( link && is_within_range_of_b(dest, pc_of_bl)) ||
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   579
        (!link && is_within_range_of_b(dest, pc_of_b)))) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   580
    // variant 2:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   581
    // Emit an optimized, pc-relative call/jump.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   582
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   583
    if (link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   584
      // some padding
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   585
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   586
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   587
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   588
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   589
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   590
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   591
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   592
      // do the call
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   593
      assert(pc() == pc_of_bl, "just checking");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   594
      bl(dest, relocInfo::none);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   595
    } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   596
      // do the jump
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   597
      assert(pc() == pc_of_b, "just checking");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   598
      b(dest, relocInfo::none);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   599
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   600
      // some padding
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   601
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   602
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   603
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   604
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   605
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   606
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   607
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   608
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   609
    // Assert that we can identify the emitted call/jump.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   610
    assert(is_bxx64_patchable_variant2_at((address)start_pc, link),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   611
           "can't identify emitted call");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   612
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   613
    // variant 1:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   614
    mr(R0, R11);  // spill R11 -> R0.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   615
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   616
    // Load the destination address into CTR,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   617
    // calculate destination relative to global toc.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   618
    calculate_address_from_global_toc(R11, dest, true, true, false);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   619
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   620
    mtctr(R11);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   621
    mr(R11, R0);  // spill R11 <- R0.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   622
    nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   623
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   624
    // do the call/jump
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   625
    if (link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   626
      bctrl();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   627
    } else{
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   628
      bctr();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   629
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   630
    // Assert that we can identify the emitted call/jump.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   631
    assert(is_bxx64_patchable_variant1b_at((address)start_pc, link),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   632
           "can't identify emitted call");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   633
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   634
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   635
  // Assert that we can identify the emitted call/jump.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   636
  assert(is_bxx64_patchable_at((address)start_pc, link),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   637
         "can't identify emitted call");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   638
  assert(get_dest_of_bxx64_patchable_at((address)start_pc, link) == dest,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   639
         "wrong encoding of dest address");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   640
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   641
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   642
// Identify a bxx64_patchable instruction.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   643
bool MacroAssembler::is_bxx64_patchable_at(address instruction_addr, bool link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   644
  return is_bxx64_patchable_variant1b_at(instruction_addr, link)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   645
    //|| is_bxx64_patchable_variant1_at(instruction_addr, link)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   646
      || is_bxx64_patchable_variant2_at(instruction_addr, link);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   647
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   648
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   649
// Does the call64_patchable instruction use a pc-relative encoding of
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   650
// the call destination?
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   651
bool MacroAssembler::is_bxx64_patchable_pcrelative_at(address instruction_addr, bool link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   652
  // variant 2 is pc-relative
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   653
  return is_bxx64_patchable_variant2_at(instruction_addr, link);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   654
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   655
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   656
// Identify variant 1.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   657
bool MacroAssembler::is_bxx64_patchable_variant1_at(address instruction_addr, bool link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   658
  unsigned int* instr = (unsigned int*) instruction_addr;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   659
  return (link ? is_bctrl(instr[6]) : is_bctr(instr[6])) // bctr[l]
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   660
      && is_mtctr(instr[5]) // mtctr
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   661
    && is_load_const_at(instruction_addr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   662
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   663
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   664
// Identify variant 1b: load destination relative to global toc.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   665
bool MacroAssembler::is_bxx64_patchable_variant1b_at(address instruction_addr, bool link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   666
  unsigned int* instr = (unsigned int*) instruction_addr;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   667
  return (link ? is_bctrl(instr[6]) : is_bctr(instr[6])) // bctr[l]
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   668
    && is_mtctr(instr[3]) // mtctr
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   669
    && is_calculate_address_from_global_toc_at(instruction_addr + 2*BytesPerInstWord, instruction_addr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   670
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   671
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   672
// Identify variant 2.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   673
bool MacroAssembler::is_bxx64_patchable_variant2_at(address instruction_addr, bool link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   674
  unsigned int* instr = (unsigned int*) instruction_addr;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   675
  if (link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   676
    return is_bl (instr[6])  // bl dest is last
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   677
      && is_nop(instr[0])  // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   678
      && is_nop(instr[1])  // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   679
      && is_nop(instr[2])  // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   680
      && is_nop(instr[3])  // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   681
      && is_nop(instr[4])  // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   682
      && is_nop(instr[5]); // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   683
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   684
    return is_b  (instr[0])  // b  dest is first
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   685
      && is_nop(instr[1])  // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   686
      && is_nop(instr[2])  // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   687
      && is_nop(instr[3])  // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   688
      && is_nop(instr[4])  // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   689
      && is_nop(instr[5])  // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   690
      && is_nop(instr[6]); // nop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   691
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   692
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   693
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   694
// Set dest address of a bxx64_patchable instruction.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   695
void MacroAssembler::set_dest_of_bxx64_patchable_at(address instruction_addr, address dest, bool link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   696
  ResourceMark rm;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   697
  int code_size = MacroAssembler::bxx64_patchable_size;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   698
  CodeBuffer buf(instruction_addr, code_size);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   699
  MacroAssembler masm(&buf);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   700
  masm.bxx64_patchable(dest, relocInfo::none, link);
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
   701
  ICache::ppc64_flush_icache_bytes(instruction_addr, code_size);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   702
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   703
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   704
// Get dest address of a bxx64_patchable instruction.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   705
address MacroAssembler::get_dest_of_bxx64_patchable_at(address instruction_addr, bool link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   706
  if (is_bxx64_patchable_variant1_at(instruction_addr, link)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   707
    return (address) (unsigned long) get_const(instruction_addr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   708
  } else if (is_bxx64_patchable_variant2_at(instruction_addr, link)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   709
    unsigned int* instr = (unsigned int*) instruction_addr;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   710
    if (link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   711
      const int instr_idx = 6; // bl is last
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   712
      int branchoffset = branch_destination(instr[instr_idx], 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   713
      return instruction_addr + branchoffset + instr_idx*BytesPerInstWord;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   714
    } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   715
      const int instr_idx = 0; // b is first
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   716
      int branchoffset = branch_destination(instr[instr_idx], 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   717
      return instruction_addr + branchoffset + instr_idx*BytesPerInstWord;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   718
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   719
  // Load dest relative to global toc.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   720
  } else if (is_bxx64_patchable_variant1b_at(instruction_addr, link)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   721
    return get_address_of_calculate_address_from_global_toc_at(instruction_addr + 2*BytesPerInstWord,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   722
                                                               instruction_addr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   723
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   724
    ShouldNotReachHere();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   725
    return NULL;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   726
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   727
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   728
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   729
// Uses ordering which corresponds to ABI:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   730
//    _savegpr0_14:  std  r14,-144(r1)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   731
//    _savegpr0_15:  std  r15,-136(r1)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   732
//    _savegpr0_16:  std  r16,-128(r1)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   733
void MacroAssembler::save_nonvolatile_gprs(Register dst, int offset) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   734
  std(R14, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   735
  std(R15, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   736
  std(R16, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   737
  std(R17, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   738
  std(R18, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   739
  std(R19, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   740
  std(R20, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   741
  std(R21, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   742
  std(R22, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   743
  std(R23, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   744
  std(R24, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   745
  std(R25, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   746
  std(R26, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   747
  std(R27, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   748
  std(R28, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   749
  std(R29, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   750
  std(R30, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   751
  std(R31, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   752
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   753
  stfd(F14, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   754
  stfd(F15, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   755
  stfd(F16, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   756
  stfd(F17, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   757
  stfd(F18, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   758
  stfd(F19, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   759
  stfd(F20, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   760
  stfd(F21, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   761
  stfd(F22, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   762
  stfd(F23, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   763
  stfd(F24, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   764
  stfd(F25, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   765
  stfd(F26, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   766
  stfd(F27, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   767
  stfd(F28, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   768
  stfd(F29, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   769
  stfd(F30, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   770
  stfd(F31, offset, dst);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   771
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   772
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   773
// Uses ordering which corresponds to ABI:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   774
//    _restgpr0_14:  ld   r14,-144(r1)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   775
//    _restgpr0_15:  ld   r15,-136(r1)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   776
//    _restgpr0_16:  ld   r16,-128(r1)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   777
void MacroAssembler::restore_nonvolatile_gprs(Register src, int offset) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   778
  ld(R14, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   779
  ld(R15, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   780
  ld(R16, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   781
  ld(R17, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   782
  ld(R18, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   783
  ld(R19, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   784
  ld(R20, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   785
  ld(R21, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   786
  ld(R22, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   787
  ld(R23, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   788
  ld(R24, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   789
  ld(R25, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   790
  ld(R26, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   791
  ld(R27, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   792
  ld(R28, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   793
  ld(R29, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   794
  ld(R30, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   795
  ld(R31, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   796
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   797
  // FP registers
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   798
  lfd(F14, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   799
  lfd(F15, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   800
  lfd(F16, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   801
  lfd(F17, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   802
  lfd(F18, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   803
  lfd(F19, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   804
  lfd(F20, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   805
  lfd(F21, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   806
  lfd(F22, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   807
  lfd(F23, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   808
  lfd(F24, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   809
  lfd(F25, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   810
  lfd(F26, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   811
  lfd(F27, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   812
  lfd(F28, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   813
  lfd(F29, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   814
  lfd(F30, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   815
  lfd(F31, offset, src);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   816
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   817
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   818
// For verify_oops.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   819
void MacroAssembler::save_volatile_gprs(Register dst, int offset) {
28187
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
   820
  std(R2,  offset, dst);   offset += 8;
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   821
  std(R3,  offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   822
  std(R4,  offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   823
  std(R5,  offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   824
  std(R6,  offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   825
  std(R7,  offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   826
  std(R8,  offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   827
  std(R9,  offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   828
  std(R10, offset, dst);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   829
  std(R11, offset, dst);   offset += 8;
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   830
  std(R12, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   831
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   832
  stfd(F0, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   833
  stfd(F1, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   834
  stfd(F2, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   835
  stfd(F3, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   836
  stfd(F4, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   837
  stfd(F5, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   838
  stfd(F6, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   839
  stfd(F7, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   840
  stfd(F8, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   841
  stfd(F9, offset, dst);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   842
  stfd(F10, offset, dst);  offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   843
  stfd(F11, offset, dst);  offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   844
  stfd(F12, offset, dst);  offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   845
  stfd(F13, offset, dst);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   846
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   847
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   848
// For verify_oops.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   849
void MacroAssembler::restore_volatile_gprs(Register src, int offset) {
28187
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
   850
  ld(R2,  offset, src);   offset += 8;
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   851
  ld(R3,  offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   852
  ld(R4,  offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   853
  ld(R5,  offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   854
  ld(R6,  offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   855
  ld(R7,  offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   856
  ld(R8,  offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   857
  ld(R9,  offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   858
  ld(R10, offset, src);   offset += 8;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   859
  ld(R11, offset, src);   offset += 8;
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   860
  ld(R12, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   861
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   862
  lfd(F0, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   863
  lfd(F1, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   864
  lfd(F2, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   865
  lfd(F3, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   866
  lfd(F4, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   867
  lfd(F5, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   868
  lfd(F6, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   869
  lfd(F7, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   870
  lfd(F8, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   871
  lfd(F9, offset, src);   offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   872
  lfd(F10, offset, src);  offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   873
  lfd(F11, offset, src);  offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   874
  lfd(F12, offset, src);  offset += 8;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   875
  lfd(F13, offset, src);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   876
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   877
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   878
// Saves CR and LR into the `cr` and `lr` slots of the ABI area addressed
// through R1_SP, using `tmp` as the transfer register.
// `tmp` must not be R1_SP: it is overwritten by mfcr before R1_SP is used as
// the base of the stores (same precondition as restore_LR_CR).
void MacroAssembler::save_LR_CR(Register tmp) {
  assert(tmp != R1_SP, "must be distinct");
  mfcr(tmp);
  std(tmp, _abi(cr), R1_SP);
  mflr(tmp);
  std(tmp, _abi(lr), R1_SP);
  // Tmp must contain lr on exit! (see return_addr and prolog in ppc64.ad)
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   885
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   886
// Reloads LR and CR from the `lr` and `cr` slots of the ABI area addressed
// through R1_SP. `tmp` is clobbered; on exit it holds the value loaded from
// the `cr` slot.
void MacroAssembler::restore_LR_CR(Register tmp) {
  assert(tmp != R1_SP, "must be distinct");

  // Link register first ...
  ld(tmp, _abi(lr), R1_SP);
  mtlr(tmp);

  // ... then the condition register.
  ld(tmp, _abi(cr), R1_SP);
  mtcr(tmp);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   893
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   894
// Emits a branch-and-link to the immediately following instruction and then
// copies LR into `result`. LR is overwritten in the process.
// Returns the assembler's pc() at the bound label, i.e. the position at
// which the mflr is emitted.
address MacroAssembler::get_PC_trash_LR(Register result) {
  Label next_insn;
  bl(next_insn);
  bind(next_insn);
  address pc_at_label = pc();
  mflr(result);
  return pc_at_label;
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   902
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   903
// Resizes the current frame by the byte amount held in register `offset`
// while keeping the back link intact. `tmp` is clobbered.
void MacroAssembler::resize_frame(Register offset, Register tmp) {
#ifdef ASSERT
  assert_different_registers(offset, tmp, R1_SP);
  // Emitted check: the low alignment bits of `offset` must be zero.
  andi_(tmp, offset, frame::alignment_in_bytes-1);
  asm_assert_eq("resize_frame: unaligned", 0x204);
#endif

  // Load the back link stored at the current SP.
  ld(tmp, _abi(callers_sp), R1_SP);

  // Store-with-update:
  //   new_sp    = SP + offset
  //   *(new_sp) = tmp
  //   SP        = new_sp
  stdux(tmp, R1_SP, offset);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   917
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   918
void MacroAssembler::resize_frame(int offset, Register tmp) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   919
  assert(is_simm(offset, 16), "too big an offset");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   920
  assert_different_registers(tmp, R1_SP);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   921
  assert((offset & (frame::alignment_in_bytes-1))==0, "resize_frame: unaligned");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   922
  // tmp <- *(SP)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   923
  ld(tmp, _abi(callers_sp), R1_SP);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   924
  // addr <- SP + offset;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   925
  // *(addr) <- tmp;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   926
  // SP <- addr
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   927
  stdu(tmp, offset, R1_SP);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   928
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   929
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   930
// Moves SP to the absolute address `addr`, keeping the back link.
// `tmp1` receives the distance `addr - SP`; `tmp2` is the scratch register
// handed on to resize_frame(Register, Register).
void MacroAssembler::resize_frame_absolute(Register addr, Register tmp1, Register tmp2) {
  // Note: addr may alias tmp1 or tmp2; only tmp1 and tmp2 must differ.
  assert(tmp1 != tmp2, "must be distinct");

  // Turn the absolute target into an offset relative to the current SP:
  //   tmp1 <- addr - SP (!)
  subf(tmp1, R1_SP, addr);

  // Update SP and re-store the back link in one step.
  resize_frame(tmp1/* offset */, tmp2/* tmp */);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   941
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   942
// Pushes a frame whose size in bytes is held in register `bytes`.
// `tmp` receives the negated size. Debug builds additionally use R0 as
// scratch for the emitted alignment check.
void MacroAssembler::push_frame(Register bytes, Register tmp) {
#ifdef ASSERT
  assert(bytes != R0, "r0 not allowed here");
  // Emitted check: the low alignment bits of `bytes` must be zero.
  andi_(R0, bytes, frame::alignment_in_bytes-1);
  asm_assert_eq("push_frame(Reg, Reg): unaligned", 0x203);
#endif

  // tmp <- -bytes
  neg(tmp, bytes);
  // Store the old SP at SP + tmp and make that address the new SP.
  stdux(R1_SP, R1_SP, tmp);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   951
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   952
// Push a frame of size `bytes'.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   953
void MacroAssembler::push_frame(unsigned int bytes, Register tmp) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   954
  long offset = align_addr(bytes, frame::alignment_in_bytes);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   955
  if (is_simm(-offset, 16)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   956
    stdu(R1_SP, -offset, R1_SP);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   957
  } else {
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
   958
    load_const_optimized(tmp, -offset);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   959
    stdux(R1_SP, R1_SP, tmp);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   960
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   961
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   962
23211
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
   963
// Push a frame of size `bytes' plus abi_reg_args on top.
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
   964
void MacroAssembler::push_frame_reg_args(unsigned int bytes, Register tmp) {
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
   965
  push_frame(bytes + frame::abi_reg_args_size, tmp);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   966
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   967
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   968
// Setup up a new C frame with a spill area for non-volatile GPRs and
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   969
// additional space for local variables.
23211
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
   970
void MacroAssembler::push_frame_reg_args_nonvolatiles(unsigned int bytes,
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
   971
                                                      Register tmp) {
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
   972
  push_frame(bytes + frame::abi_reg_args_size + frame::spill_nonvolatiles_size, tmp);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   973
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   974
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   975
// Pop current C frame.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   976
void MacroAssembler::pop_frame() {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   977
  ld(R1_SP, _abi(callers_sp), R1_SP);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   978
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
   979
23211
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
   980
#if defined(ABI_ELFv2)
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
   981
// Branches to the address held in `r_function_entry` through CTR. The address
// is first copied into R12 unless it is already there. With `and_link` the
// linking form (bctrl) is emitted, otherwise a plain bctr.
// Updates and returns _last_calls_return_pc (the pc() after the branch).
address MacroAssembler::branch_to(Register r_function_entry, bool and_link) {
  // TODO(asmundak): make sure the caller uses R12 as function descriptor
  // most of the times.
  if (r_function_entry != R12) {
    mr(R12, r_function_entry);
  }
  mtctr(R12);

  // Emit either a call or a plain branch.
  if (!and_link) {
    bctr();
  } else {
    bctrl();
  }

  const address return_pc = pc();
  _last_calls_return_pc = return_pc;
  return return_pc;
}
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
   998
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
   999
// Call a C function via a function descriptor and use full C
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1000
// calling conventions. Updates and returns _last_calls_return_pc.
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1001
address MacroAssembler::call_c(Register r_function_entry) {
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1002
  return branch_to(r_function_entry, /*and_link=*/true);
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1003
}
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1004
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1005
// For tail calls: only branch, don't link, so callee returns to caller of this function.
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1006
address MacroAssembler::call_c_and_return_to_caller(Register r_function_entry) {
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1007
  return branch_to(r_function_entry, /*and_link=*/false);
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1008
}
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1009
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1010
// Call the C function at the constant address `function_entry`: the address
// is loaded into R12 (R0 is passed to load_const as temp) and then called via
// the linking form of branch_to.
// NOTE(review): `rt` is not read in this variant.
address MacroAssembler::call_c(address function_entry, relocInfo::relocType rt) {
  const bool link = true;
  load_const(R12, function_entry, R0);
  return branch_to(R12, link);
}
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1014
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1015
#else
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1016
// Generic version of a call to C function via a function descriptor
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1017
// with variable support for C calling conventions (TOC, ENV, etc.).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1018
// Updates and returns _last_calls_return_pc.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1019
address MacroAssembler::branch_to(Register function_descriptor, bool and_link, bool save_toc_before_call,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1020
                                  bool restore_toc_after_call, bool load_toc_of_callee, bool load_env_of_callee) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1021
  // we emit standard ptrgl glue code here
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1022
  assert((function_descriptor != R0), "function_descriptor cannot be R0");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1023
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1024
  // retrieve necessary entries from the function descriptor
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1025
  ld(R0, in_bytes(FunctionDescriptor::entry_offset()), function_descriptor);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1026
  mtctr(R0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1027
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1028
  if (load_toc_of_callee) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1029
    ld(R2_TOC, in_bytes(FunctionDescriptor::toc_offset()), function_descriptor);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1030
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1031
  if (load_env_of_callee) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1032
    ld(R11, in_bytes(FunctionDescriptor::env_offset()), function_descriptor);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1033
  } else if (load_toc_of_callee) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1034
    li(R11, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1035
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1036
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1037
  // do a call or a branch
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1038
  if (and_link) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1039
    bctrl();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1040
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1041
    bctr();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1042
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1043
  _last_calls_return_pc = pc();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1044
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1045
  return _last_calls_return_pc;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1046
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1047
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1048
// Call a C function via a function descriptor and use full C calling
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1049
// conventions.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1050
// We don't use the TOC in generated code, so there is no need to save
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1051
// and restore its value.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1052
address MacroAssembler::call_c(Register fd) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1053
  return branch_to(fd, /*and_link=*/true,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1054
                       /*save toc=*/false,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1055
                       /*restore toc=*/false,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1056
                       /*load toc=*/true,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1057
                       /*load env=*/true);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1058
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1059
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
  1060
// Branch to the C function described by the function descriptor in register
// `fd` without linking (and_link is false), loading the callee's TOC and env.
// The current TOC is neither saved nor restored.
// Returns the value branch_to() returns.
address MacroAssembler::call_c_and_return_to_caller(Register fd) {
  const bool and_link    = false;  // plain branch: no link
  const bool save_toc    = false;
  const bool restore_toc = false;
  const bool load_toc    = true;
  const bool load_env    = true;
  return branch_to(fd, and_link, save_toc, restore_toc, load_toc, load_env);
}
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
  1067
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1068
// Call the C function described by `fd`.
//
// rt != relocInfo::none : the call must be relocatable. Both code shapes
//                         emitted here are meant to have the same size.
// rt == relocInfo::none : the call need not be relocatable, so a shorter
//                         direct `bl` is used when the target is in range.
//
// "Friend functions" (as defined by class FunctionDescriptor) are called
// directly at their entry point without loading toc and env; everything else
// goes through a full descriptor call via branch_to().
// Returns the pc following the emitted call sequence.
address MacroAssembler::call_c(const FunctionDescriptor* fd, relocInfo::relocType rt) {
  if (rt != relocInfo::none) {
    // Relocatable call. A direct call of the entry point is only possible for
    // a linked friend function reached via a runtime_call relocation.
    // fd may be NULL here to support code-size estimation.
    const bool direct_entry_call = ReoptimizeCallSequences
                                && rt == relocInfo::runtime_call_type
                                && fd != NULL
                                && fd->is_friend_function()
                                && fd->entry() != NULL;
    if (direct_entry_call) {
      // Use an optimizable call instruction; the nops keep the code size the
      // same as in the non-friend case.
      nop();
      nop();
      nop();
      bl64_patchable(fd->entry(), rt);
      _last_calls_return_pc = pc();
      return _last_calls_return_pc;
    }

    // Not a friend function (or not optimizable): do a full call-c.
    load_const(R11, (address)fd, R0);
    const bool load_env = (fd != NULL) && (fd->env() != NULL);
    return branch_to(R11, /*and_link=*/true,
                          /*save toc=*/false,
                          /*restore toc=*/false,
                          /*load toc=*/true,
                          /*load env=*/load_env);
  }

  // Non-relocatable call: more aggressive optimizations are allowed.
  if (ReoptimizeCallSequences && fd->is_friend_function()) {
    // Friend function: call the entry point, don't care about toc and env.
    const address target = fd->entry();
    if (is_within_range_of_b(target, pc())) {
      bl(target);
    } else {
      bl64_patchable(target, rt);
    }
    _last_calls_return_pc = pc();
    return _last_calls_return_pc;
  }

  // Not a friend function: do a full call-c.
  load_const(R11, (address)fd, R0);
  return branch_to(R11, /*and_link=*/true,
                        /*save toc=*/false,
                        /*restore toc=*/false,
                        /*load toc=*/true,
                        /*load env=*/true);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1124
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1125
// Call a C function.  All constants needed reside in TOC.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1126
//
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1127
// Read the address to call from the TOC.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1128
// Read env from TOC, if fd specifies an env.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1129
// Read new TOC from TOC.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1130
address MacroAssembler::call_c_using_toc(const FunctionDescriptor* fd,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1131
                                         relocInfo::relocType rt, Register toc) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1132
  if (!ReoptimizeCallSequences
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1133
    || (rt != relocInfo::runtime_call_type && rt != relocInfo::none)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1134
    || !fd->is_friend_function()) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1135
    // It's not a friend function as defined by class FunctionDescriptor,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1136
    // so do a full call-c here.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1137
    assert(fd->entry() != NULL, "function must be linked");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1138
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1139
    AddressLiteral fd_entry(fd->entry());
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1140
    bool success = load_const_from_method_toc(R11, fd_entry, toc, /*fixed_size*/ true);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1141
    mtctr(R11);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1142
    if (fd->env() == NULL) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1143
      li(R11, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1144
      nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1145
    } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1146
      AddressLiteral fd_env(fd->env());
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1147
      success = success && load_const_from_method_toc(R11, fd_env, toc, /*fixed_size*/ true);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1148
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1149
    AddressLiteral fd_toc(fd->toc());
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1150
    // Set R2_TOC (load from toc)
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1151
    success = success && load_const_from_method_toc(R2_TOC, fd_toc, toc, /*fixed_size*/ true);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1152
    bctrl();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1153
    _last_calls_return_pc = pc();
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1154
    if (!success) { return NULL; }
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1155
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1156
    // It's a friend function, load the entry point and don't care about
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1157
    // toc and env. Use an optimizable call instruction, but ensure the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1158
    // same code-size as in the case of a non-friend function.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1159
    nop();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1160
    bl64_patchable(fd->entry(), rt);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1161
    _last_calls_return_pc = pc();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1162
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1163
  return _last_calls_return_pc;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1164
}
23492
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  1165
#endif // ABI_ELFv2
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1166
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1167
void MacroAssembler::call_VM_base(Register oop_result,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1168
                                  Register last_java_sp,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1169
                                  address  entry_point,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1170
                                  bool     check_exceptions) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1171
  BLOCK_COMMENT("call_VM {");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1172
  // Determine last_java_sp register.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1173
  if (!last_java_sp->is_valid()) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1174
    last_java_sp = R1_SP;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1175
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1176
  set_top_ijava_frame_at_SP_as_last_Java_frame(last_java_sp, R11_scratch1);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1177
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1178
  // ARG1 must hold thread address.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1179
  mr(R3_ARG1, R16_thread);
23211
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1180
#if defined(ABI_ELFv2)
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1181
  address return_pc = call_c(entry_point, relocInfo::none);
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1182
#else
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1183
  address return_pc = call_c((FunctionDescriptor*)entry_point, relocInfo::none);
23211
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  1184
#endif
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1185
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1186
  reset_last_Java_frame();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1187
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1188
  // Check for pending exceptions.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1189
  if (check_exceptions) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1190
    // We don't check for exceptions here.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1191
    ShouldNotReachHere();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1192
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1193
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1194
  // Get oop result if there is one and reset the value in the thread.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1195
  if (oop_result->is_valid()) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1196
    get_vm_result(oop_result);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1197
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1198
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1199
  _last_calls_return_pc = return_pc;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1200
  BLOCK_COMMENT("} call_VM");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1201
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1202
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1203
// Common code for the call_VM_leaf variants: emit a non-relocatable C call to
// entry_point, bracketed by block comments. No last Java frame is set up here.
void MacroAssembler::call_VM_leaf_base(address entry_point) {
  BLOCK_COMMENT("call_VM_leaf {");
#if !defined(ABI_ELFv2)
  // Without ELFv2, entry_point is passed on as a function descriptor.
  call_c(CAST_FROM_FN_PTR(FunctionDescriptor*, entry_point), relocInfo::none);
#else
  call_c(entry_point, relocInfo::none);
#endif
  BLOCK_COMMENT("} call_VM_leaf");
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1212
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1213
// Call the VM function at entry_point with no explicit register arguments.
// Passes noreg as last_java_sp to call_VM_base().
void MacroAssembler::call_VM(Register oop_result, address entry_point, bool check_exceptions) {
  const Register no_last_java_sp = noreg;
  call_VM_base(oop_result, no_last_java_sp, entry_point, check_exceptions);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1216
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1217
void MacroAssembler::call_VM(Register oop_result, address entry_point, Register arg_1,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1218
                             bool check_exceptions) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1219
  // R3_ARG1 is reserved for the thread.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1220
  mr_if_needed(R4_ARG2, arg_1);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1221
  call_VM(oop_result, entry_point, check_exceptions);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1222
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1223
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1224
void MacroAssembler::call_VM(Register oop_result, address entry_point, Register arg_1, Register arg_2,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1225
                             bool check_exceptions) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1226
  // R3_ARG1 is reserved for the thread
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1227
  mr_if_needed(R4_ARG2, arg_1);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1228
  assert(arg_2 != R4_ARG2, "smashed argument");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1229
  mr_if_needed(R5_ARG3, arg_2);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1230
  call_VM(oop_result, entry_point, check_exceptions);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1231
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1232
28187
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  1233
void MacroAssembler::call_VM(Register oop_result, address entry_point, Register arg_1, Register arg_2, Register arg_3,
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  1234
                             bool check_exceptions) {
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  1235
  // R3_ARG1 is reserved for the thread
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  1236
  mr_if_needed(R4_ARG2, arg_1);
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  1237
  assert(arg_2 != R4_ARG2, "smashed argument");
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  1238
  mr_if_needed(R5_ARG3, arg_2);
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  1239
  mr_if_needed(R6_ARG4, arg_3);
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  1240
  call_VM(oop_result, entry_point, check_exceptions);
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  1241
}
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  1242
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1243
// Call the VM leaf function at entry_point with no register arguments.
// Simply forwards to call_VM_leaf_base().
void MacroAssembler::call_VM_leaf(address entry_point) {
  call_VM_leaf_base(entry_point);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1246
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1247
// Call the VM leaf function at entry_point with one register argument,
// passed in R3_ARG1.
void MacroAssembler::call_VM_leaf(address entry_point, Register arg_1) {
  mr_if_needed(R3_ARG1, arg_1);

  call_VM_leaf(entry_point);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1251
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1252
// Call the VM leaf function at entry_point with two register arguments,
// passed in R3_ARG1 and R4_ARG2.
void MacroAssembler::call_VM_leaf(address entry_point, Register arg_1, Register arg_2) {
  // arg_2 is read after R3_ARG1 has been written, so it must not live there.
  assert(arg_2 != R3_ARG1, "smashed argument");

  mr_if_needed(R3_ARG1, arg_1);
  mr_if_needed(R4_ARG2, arg_2);

  call_VM_leaf(entry_point);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1258
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1259
// Call the VM leaf function at entry_point with three register arguments,
// passed in R3_ARG1, R4_ARG2 and R5_ARG3.
void MacroAssembler::call_VM_leaf(address entry_point, Register arg_1, Register arg_2, Register arg_3) {
  // The argument registers are written in order; a later argument must not
  // live in a register that an earlier move has already written.
  assert(arg_2 != R3_ARG1, "smashed argument");
  assert(arg_3 != R3_ARG1 && arg_3 != R4_ARG2, "smashed argument");

  mr_if_needed(R3_ARG1, arg_1);
  mr_if_needed(R4_ARG2, arg_2);
  mr_if_needed(R5_ARG3, arg_3);

  call_VM_leaf(entry_point);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1267
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1268
// Check whether instruction is a read access to the polling page
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1269
// which was emitted by load_from_polling_page(..).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1270
bool MacroAssembler::is_load_from_polling_page(int instruction, void* ucontext,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1271
                                               address* polling_address_ptr) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1272
  if (!is_ld(instruction))
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1273
    return false; // It's not a ld. Fail.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1274
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1275
  int rt = inv_rt_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1276
  int ra = inv_ra_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1277
  int ds = inv_ds_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1278
  if (!(ds == 0 && ra != 0 && rt == 0)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1279
    return false; // It's not a ld(r0, X, ra). Fail.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1280
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1281
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1282
  if (!ucontext) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1283
    // Set polling address.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1284
    if (polling_address_ptr != NULL) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1285
      *polling_address_ptr = NULL;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1286
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1287
    return true; // No ucontext given. Can't check value of ra. Assume true.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1288
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1289
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1290
#ifdef LINUX
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1291
  // Ucontext given. Check that register ra contains the address of
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1292
  // the safepoing polling page.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1293
  ucontext_t* uc = (ucontext_t*) ucontext;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1294
  // Set polling address.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1295
  address addr = (address)uc->uc_mcontext.regs->gpr[ra] + (ssize_t)ds;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1296
  if (polling_address_ptr != NULL) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1297
    *polling_address_ptr = addr;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1298
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1299
  return os::is_poll_address(addr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1300
#else
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1301
  // Not on Linux, ucontext must be NULL.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1302
  ShouldNotReachHere();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1303
  return false;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1304
#endif
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1305
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1306
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1307
bool MacroAssembler::is_memory_serialization(int instruction, JavaThread* thread, void* ucontext) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1308
#ifdef LINUX
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1309
  ucontext_t* uc = (ucontext_t*) ucontext;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1310
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1311
  if (is_stwx(instruction) || is_stwux(instruction)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1312
    int ra = inv_ra_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1313
    int rb = inv_rb_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1314
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1315
    // look up content of ra and rb in ucontext
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1316
    address ra_val=(address)uc->uc_mcontext.regs->gpr[ra];
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1317
    long rb_val=(long)uc->uc_mcontext.regs->gpr[rb];
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1318
    return os::is_memory_serialize_page(thread, ra_val+rb_val);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1319
  } else if (is_stw(instruction) || is_stwu(instruction)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1320
    int ra = inv_ra_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1321
    int d1 = inv_d1_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1322
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1323
    // look up content of ra in ucontext
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1324
    address ra_val=(address)uc->uc_mcontext.regs->gpr[ra];
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1325
    return os::is_memory_serialize_page(thread, ra_val+d1);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1326
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1327
    return false;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1328
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1329
#else
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1330
  // workaround not needed on !LINUX :-)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1331
  ShouldNotCallThis();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1332
  return false;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1333
#endif
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1334
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1335
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1336
void MacroAssembler::bang_stack_with_offset(int offset) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1337
  // When increasing the stack, the old stack pointer will be written
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1338
  // to the new top of stack according to the PPC64 abi.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1339
  // Therefore, stack banging is not necessary when increasing
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1340
  // the stack by <= os::vm_page_size() bytes.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1341
  // When increasing the stack by a larger amount, this method is
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1342
  // called repeatedly to bang the intermediate pages.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1343
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1344
  // Stack grows down, caller passes positive offset.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1345
  assert(offset > 0, "must bang with positive offset");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1346
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1347
  long stdoffset = -offset;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1348
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1349
  if (is_simm(stdoffset, 16)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1350
    // Signed 16 bit offset, a simple std is ok.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1351
    if (UseLoadInstructionsForStackBangingPPC64) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1352
      ld(R0, (int)(signed short)stdoffset, R1_SP);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1353
    } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1354
      std(R0,(int)(signed short)stdoffset, R1_SP);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1355
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1356
  } else if (is_simm(stdoffset, 31)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1357
    const int hi = MacroAssembler::largeoffset_si16_si16_hi(stdoffset);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1358
    const int lo = MacroAssembler::largeoffset_si16_si16_lo(stdoffset);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1359
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1360
    Register tmp = R11;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1361
    addis(tmp, R1_SP, hi);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1362
    if (UseLoadInstructionsForStackBangingPPC64) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1363
      ld(R0,  lo, tmp);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1364
    } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1365
      std(R0, lo, tmp);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1366
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1367
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1368
    ShouldNotReachHere();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1369
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1370
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1371
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1372
// If instruction is a stack bang of the form
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1373
//    std    R0,    x(Ry),       (see bang_stack_with_offset())
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1374
//    stdu   R1_SP, x(R1_SP),    (see push_frame(), resize_frame())
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1375
// or stdux  R1_SP, Rx, R1_SP    (see push_frame(), resize_frame())
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1376
// return the banged address. Otherwise, return 0.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1377
address MacroAssembler::get_stack_bang_address(int instruction, void *ucontext) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1378
#ifdef LINUX
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1379
  ucontext_t* uc = (ucontext_t*) ucontext;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1380
  int rs = inv_rs_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1381
  int ra = inv_ra_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1382
  if (   (is_ld(instruction)   && rs == 0 &&  UseLoadInstructionsForStackBangingPPC64)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1383
      || (is_std(instruction)  && rs == 0 && !UseLoadInstructionsForStackBangingPPC64)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1384
      || (is_stdu(instruction) && rs == 1)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1385
    int ds = inv_ds_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1386
    // return banged address
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1387
    return ds+(address)uc->uc_mcontext.regs->gpr[ra];
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1388
  } else if (is_stdux(instruction) && rs == 1) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1389
    int rb = inv_rb_field(instruction);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1390
    address sp = (address)uc->uc_mcontext.regs->gpr[1];
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1391
    long rb_val = (long)uc->uc_mcontext.regs->gpr[rb];
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1392
    return ra != 1 || rb_val >= 0 ? NULL         // not a stack bang
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1393
                                  : sp + rb_val; // banged address
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1394
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1395
  return NULL; // not a stack bang
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1396
#else
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1397
  // workaround not needed on !LINUX :-)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1398
  ShouldNotCallThis();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1399
  return NULL;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1400
#endif
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1401
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1402
38931
3cf28d630349 8156923: [ppc] Implement "JEP 270: Reserved Stack Areas for Critical Sections".
goetz
parents: 38685
diff changeset
  1403
// Emit the reserved stack zone check.
// Loads the thread's reserved_stack_activation value and compares it
// (unsigned) with R1_SP. If SP is below that value, execution continues
// after this sequence. Otherwise SharedRuntime::enable_stack_reserved_zone
// is called in a temporary frame, LR is set to 'return_pc' and control is
// transferred to the throw_delayed_StackOverflowError stub.
// Uses R0 and CCR0.
void MacroAssembler::reserved_stack_check(Register return_pc) {
  Label skip_zone_enabling;

  // Fast path test: does the reserved zone need to be enabled?
  ld_ptr(R0, JavaThread::reserved_stack_activation_offset(), R16_thread);
  cmpld(CCR0, R1_SP, R0);
  blt_predict_taken(CCR0, skip_zone_enabling);

  // Slow path: enable the reserved zone again ...
  const address enable_zone_entry =
      CAST_FROM_FN_PTR(address, SharedRuntime::enable_stack_reserved_zone);
  push_frame_reg_args(0, R0);
  call_VM_leaf(enable_zone_entry, R16_thread);
  pop_frame();

  // ... and throw the stack overflow exception via the stub.
  mtlr(return_pc);
  const address throw_stub_entry = StubRoutines::throw_delayed_StackOverflowError_entry();
  load_const_optimized(R0, throw_stub_entry);
  mtctr(R0);
  bctr();

  should_not_reach_here();

  bind(skip_zone_enabling);
}
3cf28d630349 8156923: [ppc] Implement "JEP 270: Reserved Stack Areas for Critical Sections".
goetz
parents: 38685
diff changeset
  1424
39444
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1425
void MacroAssembler::getandsetd(Register dest_current_value, Register exchange_value, Register addr_base,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1426
                                bool cmpxchgx_hint) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1427
  Label retry;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1428
  bind(retry);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1429
  ldarx(dest_current_value, addr_base, cmpxchgx_hint);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1430
  stdcx_(exchange_value, addr_base);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1431
  if (UseStaticBranchPredictionInCompareAndSwapPPC64) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1432
    bne_predict_not_taken(CCR0, retry); // StXcx_ sets CCR0.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1433
  } else {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1434
    bne(                  CCR0, retry); // StXcx_ sets CCR0.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1435
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1436
}
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1437
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1438
// Emit a doubleword fetch-and-add loop on the memory at addr_base:
// ldarx loads the current value into dest_current_value, tmp receives
// dest_current_value + inc_value, and stdcx_ attempts to store tmp. The
// sequence is repeated until the conditional store succeeds.
// cmpxchgx_hint is passed on to ldarx. tmp is overwritten; CCR0 is set by
// stdcx_.
void MacroAssembler::getandaddd(Register dest_current_value, Register inc_value, Register addr_base,
                                Register tmp, bool cmpxchgx_hint) {
  Label try_again;

  bind(try_again);
  ldarx(dest_current_value, addr_base, cmpxchgx_hint); // load with reservation
  add(tmp, dest_current_value, inc_value);             // new value
  stdcx_(tmp, addr_base);                              // conditional store, sets CCR0

  // Loop back if the conditional store did not succeed.
  if (UseStaticBranchPredictionInCompareAndSwapPPC64) {
    bne_predict_not_taken(CCR0, try_again);
  } else {
    bne(CCR0, try_again);
  }
}
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1451
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1452
// Word/sub-word atomic helper functions
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1453
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1454
// Temps and addr_base are killed if size < 4 and processor does not support respective instructions.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1455
// Only signed types are supported with size < 4.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1456
// Atomic add always kills tmp1.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1457
void MacroAssembler::atomic_get_and_modify_generic(Register dest_current_value, Register exchange_value,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1458
                                                   Register addr_base, Register tmp1, Register tmp2, Register tmp3,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1459
                                                   bool cmpxchgx_hint, bool is_add, int size) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1460
  // Sub-word instructions are available since Power 8.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1461
  // For older processors, instruction_type != size holds, and we
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1462
  // emulate the sub-word instructions by constructing a 4-byte value
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1463
  // that leaves the other bytes unchanged.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1464
  const int instruction_type = VM_Version::has_lqarx() ? size : 4;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1465
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1466
  Label retry;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1467
  Register shift_amount = noreg,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1468
           val32 = dest_current_value,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1469
           modval = is_add ? tmp1 : exchange_value;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1470
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1471
  if (instruction_type != size) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1472
    assert_different_registers(tmp1, tmp2, tmp3, dest_current_value, exchange_value, addr_base);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1473
    modval = tmp1;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1474
    shift_amount = tmp2;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1475
    val32 = tmp3;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1476
    // Need some preparation: Compute shift amount, align address. Note: shorts must be 2 byte aligned.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1477
#ifdef VM_LITTLE_ENDIAN
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1478
    rldic(shift_amount, addr_base, 3, 64-5); // (dest & 3) * 8;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1479
    clrrdi(addr_base, addr_base, 2);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1480
#else
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1481
    xori(shift_amount, addr_base, (size == 1) ? 3 : 2);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1482
    clrrdi(addr_base, addr_base, 2);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1483
    rldic(shift_amount, shift_amount, 3, 64-5); // byte: ((3-dest) & 3) * 8; short: ((1-dest/2) & 1) * 16;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1484
#endif
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1485
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1486
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1487
  // atomic emulation loop
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1488
  bind(retry);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1489
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1490
  switch (instruction_type) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1491
    case 4: lwarx(val32, addr_base, cmpxchgx_hint); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1492
    case 2: lharx(val32, addr_base, cmpxchgx_hint); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1493
    case 1: lbarx(val32, addr_base, cmpxchgx_hint); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1494
    default: ShouldNotReachHere();
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1495
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1496
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1497
  if (instruction_type != size) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1498
    srw(dest_current_value, val32, shift_amount);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1499
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1500
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1501
  if (is_add) { add(modval, dest_current_value, exchange_value); }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1502
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1503
  if (instruction_type != size) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1504
    // Transform exchange value such that the replacement can be done by one xor instruction.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1505
    xorr(modval, dest_current_value, is_add ? modval : exchange_value);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1506
    clrldi(modval, modval, (size == 1) ? 56 : 48);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1507
    slw(modval, modval, shift_amount);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1508
    xorr(modval, val32, modval);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1509
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1510
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1511
  switch (instruction_type) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1512
    case 4: stwcx_(modval, addr_base); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1513
    case 2: sthcx_(modval, addr_base); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1514
    case 1: stbcx_(modval, addr_base); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1515
    default: ShouldNotReachHere();
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1516
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1517
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1518
  if (UseStaticBranchPredictionInCompareAndSwapPPC64) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1519
    bne_predict_not_taken(CCR0, retry); // StXcx_ sets CCR0.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1520
  } else {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1521
    bne(                  CCR0, retry); // StXcx_ sets CCR0.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1522
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1523
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1524
  // l?arx zero-extends, but Java wants byte/short values sign-extended.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1525
  if (size == 1) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1526
    extsb(dest_current_value, dest_current_value);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1527
  } else if (size == 2) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1528
    extsh(dest_current_value, dest_current_value);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1529
  };
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1530
}
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1531
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1532
// Temps, addr_base and exchange_value are killed if size < 4 and processor does not support respective instructions.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1533
// Only signed types are supported with size < 4.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1534
void MacroAssembler::cmpxchg_loop_body(ConditionRegister flag, Register dest_current_value,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1535
                                       Register compare_value, Register exchange_value,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1536
                                       Register addr_base, Register tmp1, Register tmp2,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1537
                                       Label &retry, Label &failed, bool cmpxchgx_hint, int size) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1538
  // Sub-word instructions are available since Power 8.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1539
  // For older processors, instruction_type != size holds, and we
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1540
  // emulate the sub-word instructions by constructing a 4-byte value
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1541
  // that leaves the other bytes unchanged.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1542
  const int instruction_type = VM_Version::has_lqarx() ? size : 4;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1543
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1544
  Register shift_amount = noreg,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1545
           val32 = dest_current_value,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1546
           modval = exchange_value;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1547
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1548
  if (instruction_type != size) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1549
    assert_different_registers(tmp1, tmp2, dest_current_value, compare_value, exchange_value, addr_base);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1550
    shift_amount = tmp1;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1551
    val32 = tmp2;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1552
    modval = tmp2;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1553
    // Need some preperation: Compute shift amount, align address. Note: shorts must be 2 byte aligned.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1554
#ifdef VM_LITTLE_ENDIAN
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1555
    rldic(shift_amount, addr_base, 3, 64-5); // (dest & 3) * 8;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1556
    clrrdi(addr_base, addr_base, 2);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1557
#else
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1558
    xori(shift_amount, addr_base, (size == 1) ? 3 : 2);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1559
    clrrdi(addr_base, addr_base, 2);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1560
    rldic(shift_amount, shift_amount, 3, 64-5); // byte: ((3-dest) & 3) * 8; short: ((1-dest/2) & 1) * 16;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1561
#endif
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1562
    // Transform exchange value such that the replacement can be done by one xor instruction.
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1563
    xorr(exchange_value, compare_value, exchange_value);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1564
    clrldi(exchange_value, exchange_value, (size == 1) ? 56 : 48);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1565
    slw(exchange_value, exchange_value, shift_amount);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1566
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1567
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1568
  // atomic emulation loop
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1569
  bind(retry);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1570
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1571
  switch (instruction_type) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1572
    case 4: lwarx(val32, addr_base, cmpxchgx_hint); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1573
    case 2: lharx(val32, addr_base, cmpxchgx_hint); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1574
    case 1: lbarx(val32, addr_base, cmpxchgx_hint); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1575
    default: ShouldNotReachHere();
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1576
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1577
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1578
  if (instruction_type != size) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1579
    srw(dest_current_value, val32, shift_amount);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1580
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1581
  if (size == 1) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1582
    extsb(dest_current_value, dest_current_value);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1583
  } else if (size == 2) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1584
    extsh(dest_current_value, dest_current_value);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1585
  };
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1586
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1587
  cmpw(flag, dest_current_value, compare_value);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1588
  if (UseStaticBranchPredictionInCompareAndSwapPPC64) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1589
    bne_predict_not_taken(flag, failed);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1590
  } else {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1591
    bne(                  flag, failed);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1592
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1593
  // branch to done  => (flag == ne), (dest_current_value != compare_value)
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1594
  // fall through    => (flag == eq), (dest_current_value == compare_value)
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1595
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1596
  if (instruction_type != size) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1597
    xorr(modval, val32, exchange_value);
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1598
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1599
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1600
  switch (instruction_type) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1601
    case 4: stwcx_(modval, addr_base); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1602
    case 2: sthcx_(modval, addr_base); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1603
    case 1: stbcx_(modval, addr_base); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1604
    default: ShouldNotReachHere();
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1605
  }
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1606
}
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1607
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1608
// CmpxchgX sets condition register to cmpX(current, compare).
39444
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1609
void MacroAssembler::cmpxchg_generic(ConditionRegister flag, Register dest_current_value,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1610
                                     Register compare_value, Register exchange_value,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1611
                                     Register addr_base, Register tmp1, Register tmp2,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1612
                                     int semantics, bool cmpxchgx_hint,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1613
                                     Register int_flag_success, bool contention_hint, bool weak, int size) {
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1614
  Label retry;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1615
  Label failed;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1616
  Label done;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1617
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1618
  // Save one branch if result is returned via register and
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1619
  // result register is different from the other ones.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1620
  bool use_result_reg    = (int_flag_success != noreg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1621
  bool preset_result_reg = (int_flag_success != dest_current_value && int_flag_success != compare_value &&
39444
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1622
                            int_flag_success != exchange_value && int_flag_success != addr_base &&
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1623
                            int_flag_success != tmp1 && int_flag_success != tmp2);
38685
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1624
  assert(!weak || flag == CCR0, "weak only supported with CCR0");
39444
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1625
  assert(size == 1 || size == 2 || size == 4, "unsupported");
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1626
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1627
  if (use_result_reg && preset_result_reg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1628
    li(int_flag_success, 0); // preset (assume cas failed)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1629
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1630
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1631
  // Add simple guard in order to reduce risk of starving under high contention (recommended by IBM).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1632
  if (contention_hint) { // Don't try to reserve if cmp fails.
39444
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1633
    switch (size) {
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1634
      case 1: lbz(dest_current_value, 0, addr_base); extsb(dest_current_value, dest_current_value); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1635
      case 2: lha(dest_current_value, 0, addr_base); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1636
      case 4: lwz(dest_current_value, 0, addr_base); break;
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1637
      default: ShouldNotReachHere();
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1638
    }
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1639
    cmpw(flag, dest_current_value, compare_value);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1640
    bne(flag, failed);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1641
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1642
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1643
  // release/fence semantics
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1644
  if (semantics & MemBarRel) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1645
    release();
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1646
  }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1647
39444
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1648
  cmpxchg_loop_body(flag, dest_current_value, compare_value, exchange_value, addr_base, tmp1, tmp2,
2eae9b74c1f3 8159976: PPC64: Add missing intrinsics for sub-word atomics
mdoerr
parents: 38931
diff changeset
  1649
                    retry, failed, cmpxchgx_hint, size);
38685
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1650
  if (!weak || use_result_reg) {
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1651
    if (UseStaticBranchPredictionInCompareAndSwapPPC64) {
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1652
      bne_predict_not_taken(CCR0, weak ? failed : retry); // StXcx_ sets CCR0.
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1653
    } else {
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1654
      bne(                  CCR0, weak ? failed : retry); // StXcx_ sets CCR0.
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1655
    }
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1656
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1657
  // fall through    => (flag == eq), (dest_current_value == compare_value), (swapped)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1658
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1659
  // Result in register (must do this at the end because int_flag_success can be the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1660
  // same register as one above).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1661
  if (use_result_reg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1662
    li(int_flag_success, 1);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1663
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1664
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1665
  if (semantics & MemBarFenceAfter) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1666
    fence();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1667
  } else if (semantics & MemBarAcq) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1668
    isync();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1669
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1670
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1671
  if (use_result_reg && !preset_result_reg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1672
    b(done);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1673
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1674
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1675
  bind(failed);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1676
  if (use_result_reg && !preset_result_reg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1677
    li(int_flag_success, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1678
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1679
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1680
  bind(done);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1681
  // (flag == ne) => (dest_current_value != compare_value), (!swapped)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1682
  // (flag == eq) => (dest_current_value == compare_value), ( swapped)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1683
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1684
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1685
// Performs an atomic compare-and-exchange:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1686
//   if (compare_value == *addr_base)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1687
//     *addr_base = exchange_value
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1688
//     int_flag_success = 1;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1689
//   else
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1690
//     int_flag_success = 0;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1691
//
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1692
// ConditionRegister flag       = cmp(compare_value, *addr_base)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1693
// Register dest_current_value  = *addr_base
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1694
// Register compare_value       Used to compare with value in memory
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1695
// Register exchange_value      Written to memory if compare_value == *addr_base
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1696
// Register addr_base           The memory location to compareXChange
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1697
// Register int_flag_success    Set to 1 if exchange_value was written to *addr_base
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1698
//
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1699
// To avoid the costly compare exchange the value is tested beforehand.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1700
// Several special cases exist to avoid generating unnecessary code.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1701
//
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1702
// Emits a 64-bit compare-and-exchange sequence built from ldarx / cmpd / stdcx_.
//
// Parameters not covered by the register table preceding this function:
//   semantics        Bit mask. If MemBarRel is set, release() is emitted ahead of the
//                    loop. After the store, fence() is emitted if MemBarFenceAfter is
//                    set, otherwise isync() if MemBarAcq is set.
//   cmpxchgx_hint    Passed through unchanged as the hint argument of ldarx.
//   int_flag_success May be noreg, in which case no result register is written.
//   failed_ext       Optional label branched to on failure. Must be NULL when
//                    int_flag_success is used (asserted below).
//   contention_hint  If true, a plain ld / cmpd / bne pre-check is emitted in front of
//                    the reserving load.
//   weak             If true, a failed stdcx_ is not retried. Requires flag == CCR0
//                    (asserted below).
void MacroAssembler::cmpxchgd(ConditionRegister flag,
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  1703
                              Register dest_current_value, RegisterOrConstant compare_value, Register exchange_value,
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1704
                              Register addr_base, int semantics, bool cmpxchgx_hint,
38685
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1705
                              Register int_flag_success, Label* failed_ext, bool contention_hint, bool weak) {
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1706
  // Head of the ldarx/stdcx_ loop.
  Label retry;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1707
  Label failed_int;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1708
  // Failure target: the caller's label if one was supplied, otherwise the local one.
  Label& failed = (failed_ext != NULL) ? *failed_ext : failed_int;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1709
  Label done;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1710
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1711
  // Save one branch if result is returned via register and result register is different from the other ones.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1712
  bool use_result_reg    = (int_flag_success!=noreg);
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  1713
  // Presetting the result to 0 is only possible if that does not overwrite an input register.
  bool preset_result_reg = (int_flag_success!=dest_current_value && int_flag_success!=compare_value.register_or_noreg() &&
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1714
                            int_flag_success!=exchange_value && int_flag_success!=addr_base);
38685
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1715
  assert(!weak || flag == CCR0, "weak only supported with CCR0");
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1716
  assert(int_flag_success == noreg || failed_ext == NULL, "cannot have both");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1717
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1718
  if (use_result_reg && preset_result_reg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1719
    li(int_flag_success, 0); // preset (assume cas failed)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1720
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1721
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1722
  // Add simple guard in order to reduce risk of starving under high contention (recommended by IBM).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1723
  if (contention_hint) { // Don't try to reserve if cmp fails.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1724
    // Non-reserving load; a mismatch branches to failed before any barrier is emitted.
    ld(dest_current_value, 0, addr_base);
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  1725
    cmpd(flag, compare_value, dest_current_value);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1726
    bne(flag, failed);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1727
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1728
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1729
  // release/fence semantics
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1730
  if (semantics & MemBarRel) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1731
    release();
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1732
  }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1733
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1734
  // atomic emulation loop
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1735
  bind(retry);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1736
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1737
  // Reserving load of the current value, compared against the expected value.
  ldarx(dest_current_value, addr_base, cmpxchgx_hint);
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  1738
  cmpd(flag, compare_value, dest_current_value);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1739
  if (UseStaticBranchPredictionInCompareAndSwapPPC64) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1740
    bne_predict_not_taken(flag, failed);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1741
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1742
    bne(                  flag, failed);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1743
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1744
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1745
  // Conditional store of the new value.
  stdcx_(exchange_value, addr_base);
38685
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1746
  // Strong CAS: loop back to retry if the store failed. Weak CAS: branch to failed instead.
  // A weak CAS with neither a result register nor a failure label emits no branch here
  // (presumably the caller then inspects CCR0 itself -- confirm against callers).
  if (!weak || use_result_reg || failed_ext) {
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1747
    if (UseStaticBranchPredictionInCompareAndSwapPPC64) {
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1748
      bne_predict_not_taken(CCR0, weak ? failed : retry); // stXcx_ sets CCR0
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1749
    } else {
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1750
      bne(                  CCR0, weak ? failed : retry); // stXcx_ sets CCR0
e34308190947 8141635: Implement VarHandles/Unsafe intrinsics on POWER
mdoerr
parents: 38074
diff changeset
  1751
    }
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1752
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1753
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1754
  // result in register (must do this at the end because int_flag_success can be the same register as one above)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1755
  if (use_result_reg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1756
    li(int_flag_success, 1);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1757
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1758
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1759
  // Trailing barrier. It sits on the fall-through (success) path; branches to the local
  // failure label land below it.
  if (semantics & MemBarFenceAfter) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1760
    fence();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1761
  } else if (semantics & MemBarAcq) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1762
    isync();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1763
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1764
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1765
  // Result register could not be preset: jump over the failure path that zeroes it.
  if (use_result_reg && !preset_result_reg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1766
    b(done);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1767
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1768
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1769
  // The local failure label is bound here unconditionally, i.e. also when failed_ext
  // was supplied and no branch targets it.
  bind(failed_int);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1770
  if (use_result_reg && !preset_result_reg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1771
    li(int_flag_success, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1772
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1773
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1774
  bind(done);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1775
  // (flag == ne) => (dest_current_value != compare_value), (!swapped)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1776
  // (flag == eq) => (dest_current_value == compare_value), ( swapped)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1777
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1778
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1779
// Look up the method for a megamorphic invokeinterface call.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1780
// The target method is determined by <intf_klass, itable_index>.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1781
// The receiver klass is in recv_klass.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1782
// On success, the result will be in method_result, and execution falls through.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1783
// On failure, execution transfers to the given label.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1784
// Emits the itable scan for an interface call.
//
// Register           recv_klass           Receiver klass. Modified: the scaled itable index
//                                         plus the method offset within an itableMethodEntry
//                                         is added to it.
// Register           intf_klass           Interface klass each scanned entry is compared with.
// RegisterOrConstant itable_index         Constant, or a register that must be the same as
//                                         method_result (asserted). A register index is
//                                         scaled in place.
// Register           method_result        Receives the loaded method. Also holds the interface
//                                         of the entry currently being scanned.
// Register           scan_temp            Temp: address of the current itableOffsetEntry, then
//                                         the offset read from the matching entry.
// Register           sethi_temp           Temp: only written when itable_index is a constant.
// Label&             L_no_such_interface  Branch target when a null interface entry is reached.
void MacroAssembler::lookup_interface_method(Register recv_klass,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1785
                                             Register intf_klass,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1786
                                             RegisterOrConstant itable_index,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1787
                                             Register method_result,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1788
                                             Register scan_temp,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1789
                                             Register sethi_temp,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1790
                                             Label& L_no_such_interface) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1791
  // Note: sethi_temp is not part of this check.
  assert_different_registers(recv_klass, intf_klass, method_result, scan_temp);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1792
  assert(itable_index.is_constant() || itable_index.as_register() == method_result,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1793
         "caller must use same register for non-constant itable index as for method");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1794
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1795
  // Compute start of first itableOffsetEntry (which is at the end of the vtable).
35899
0dbc821628fc 8148047: Move the vtable length field to Klass
mgerdin
parents: 35871
diff changeset
  1796
  int vtable_base = in_bytes(Klass::vtable_start_offset());
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1797
  int itentry_off = itableMethodEntry::method_offset_in_bytes();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1798
  int logMEsize   = exact_log2(itableMethodEntry::size() * wordSize);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1799
  int scan_step   = itableOffsetEntry::size() * wordSize;
35871
607bf949dfb3 8147461: Use byte offsets for vtable start and vtable length offsets
mgerdin
parents: 35232
diff changeset
  1800
  int log_vte_size= exact_log2(vtableEntry::size_in_bytes());
607bf949dfb3 8147461: Use byte offsets for vtable start and vtable length offsets
mgerdin
parents: 35232
diff changeset
  1801
35899
0dbc821628fc 8148047: Move the vtable length field to Klass
mgerdin
parents: 35871
diff changeset
  1802
  // scan_temp = recv_klass + vtable_base + (vtable length << log_vte_size)
  lwz(scan_temp, in_bytes(Klass::vtable_length_offset()), recv_klass);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1803
  // %%% We should store the aligned, prescaled offset in the klassoop.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1804
  // Then the next several instructions would fold away.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1805
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1806
  sldi(scan_temp, scan_temp, log_vte_size);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1807
  addi(scan_temp, scan_temp, vtable_base);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1808
  add(scan_temp, recv_klass, scan_temp);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1809
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1810
  // Adjust recv_klass by scaled itable_index, so we can free itable_index.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1811
  if (itable_index.is_register()) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1812
    // The index register is scaled and biased in place, i.e. its original value is lost.
    Register itable_offset = itable_index.as_register();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1813
    sldi(itable_offset, itable_offset, logMEsize);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1814
    if (itentry_off) addi(itable_offset, itable_offset, itentry_off);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1815
    add(recv_klass, itable_offset, recv_klass);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1816
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1817
    // Constant index: the byte offset is computed at code-generation time and
    // materialized in sethi_temp.
    long itable_offset = (long)itable_index.as_constant();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1818
    load_const_optimized(sethi_temp, (itable_offset<<logMEsize)+itentry_off); // static address, no relocation
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1819
    add(recv_klass, sethi_temp, recv_klass);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1820
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1821
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1822
  // for (scan = klass->itable(); scan->interface() != NULL; scan += scan_step) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1823
  //   if (scan->interface() == intf) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1824
  //     result = (klass + scan->offset() + itable_index);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1825
  //   }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1826
  // }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1827
  Label search, found_method;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1828
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1829
  // The load/compare is emitted twice. peel == 1 emits the first check (branching
  // forward to found_method on a match) followed by the loop head 'search' with the
  // null check and the advance. peel == 0 emits the in-loop check, which branches back
  // to 'search' on a mismatch and otherwise falls through to found_method.
  for (int peel = 1; peel >= 0; peel--) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1830
    // %%%% Could load both offset and interface in one ldx, if they were
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1831
    // in the opposite order. This would save a load.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1832
    ld(method_result, itableOffsetEntry::interface_offset_in_bytes(), scan_temp);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1833
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1834
    // Check that this entry is non-null. A null entry means that
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1835
    // the receiver class doesn't implement the interface, and wasn't the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1836
    // same as when the caller was compiled.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1837
    cmpd(CCR0, method_result, intf_klass);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1838
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1839
    if (peel) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1840
      beq(CCR0, found_method);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1841
    } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1842
      bne(CCR0, search);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1843
      // (invert the test to fall through to found_method...)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1844
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1845
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1846
    if (!peel) break;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1847
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1848
    bind(search);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1849
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1850
    // A null interface entry ends the scan unsuccessfully; otherwise step to the next entry.
    cmpdi(CCR0, method_result, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1851
    beq(CCR0, L_no_such_interface);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1852
    addi(scan_temp, scan_temp, scan_step);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1853
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1854
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1855
  bind(found_method);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1856
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1857
  // Got a hit.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1858
  int ito_offset = itableOffsetEntry::offset_offset_in_bytes();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1859
  // Read the 32-bit offset stored in the matching entry, then load the method from
  // recv_klass (already advanced by the scaled index above) plus that offset.
  lwz(scan_temp, ito_offset, scan_temp);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1860
  ldx(method_result, scan_temp, recv_klass);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1861
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1862
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1863
// virtual method calling
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1864
void MacroAssembler::lookup_virtual_method(Register recv_klass,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1865
                                           RegisterOrConstant vtable_index,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1866
                                           Register method_result) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1867
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1868
  assert_different_registers(recv_klass, method_result, vtable_index.register_or_noreg());
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1869
35899
0dbc821628fc 8148047: Move the vtable length field to Klass
mgerdin
parents: 35871
diff changeset
  1870
  const int base = in_bytes(Klass::vtable_start_offset());
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1871
  assert(vtableEntry::size() * wordSize == wordSize, "adjust the scaling in the code below");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1872
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1873
  if (vtable_index.is_register()) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1874
    sldi(vtable_index.as_register(), vtable_index.as_register(), LogBytesPerWord);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1875
    add(recv_klass, vtable_index.as_register(), recv_klass);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1876
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1877
    addi(recv_klass, recv_klass, vtable_index.as_constant() << LogBytesPerWord);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1878
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1879
  ld(R19_method, base + vtableEntry::method_offset_in_bytes(), recv_klass);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1880
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1881
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1882
/////////////////////////////////////////// subtype checking ////////////////////////////////////////////
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1883
void MacroAssembler::check_klass_subtype_fast_path(Register sub_klass,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1884
                                                   Register super_klass,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1885
                                                   Register temp1_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1886
                                                   Register temp2_reg,
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1887
                                                   Label* L_success,
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1888
                                                   Label* L_failure,
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1889
                                                   Label* L_slow_path,
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1890
                                                   RegisterOrConstant super_check_offset) {
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1891
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1892
  const Register check_cache_offset = temp1_reg;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1893
  const Register cached_super       = temp2_reg;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1894
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1895
  assert_different_registers(sub_klass, super_klass, check_cache_offset, cached_super);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1896
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1897
  int sco_offset = in_bytes(Klass::super_check_offset_offset());
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1898
  int sc_offset  = in_bytes(Klass::secondary_super_cache_offset());
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1899
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1900
  bool must_load_sco = (super_check_offset.constant_or_zero() == -1);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1901
  bool need_slow_path = (must_load_sco || super_check_offset.constant_or_zero() == sco_offset);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1902
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1903
  Label L_fallthrough;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1904
  int label_nulls = 0;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1905
  if (L_success == NULL)   { L_success   = &L_fallthrough; label_nulls++; }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1906
  if (L_failure == NULL)   { L_failure   = &L_fallthrough; label_nulls++; }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1907
  if (L_slow_path == NULL) { L_slow_path = &L_fallthrough; label_nulls++; }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1908
  assert(label_nulls <= 1 ||
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1909
         (L_slow_path == &L_fallthrough && label_nulls <= 2 && !need_slow_path),
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1910
         "at most one NULL in the batch, usually");
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1911
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1912
  // If the pointers are equal, we are done (e.g., String[] elements).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1913
  // This self-check enables sharing of secondary supertype arrays among
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1914
  // non-primary types such as array-of-interface. Otherwise, each such
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1915
  // type would need its own customized SSA.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1916
  // We move this check to the front of the fast path because many
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1917
  // type checks are in fact trivially successful in this manner,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1918
  // so we get a nicely predicted branch right at the start of the check.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1919
  cmpd(CCR0, sub_klass, super_klass);
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1920
  beq(CCR0, *L_success);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1921
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1922
  // Check the supertype display:
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1923
  if (must_load_sco) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1924
    // The super check offset is always positive...
42068
18c8a4d5998e 8168083: PPC64: Cleanup template interpreter after 8154580 and 8154867
mdoerr
parents: 41334
diff changeset
  1925
    lwz(check_cache_offset, sco_offset, super_klass);
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1926
    super_check_offset = RegisterOrConstant(check_cache_offset);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1927
    // super_check_offset is register.
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1928
    assert_different_registers(sub_klass, super_klass, cached_super, super_check_offset.as_register());
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1929
  }
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1930
  // The loaded value is the offset from KlassOopDesc.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1931
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1932
  ld(cached_super, super_check_offset, sub_klass);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1933
  cmpd(CCR0, cached_super, super_klass);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1934
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1935
  // This check has worked decisively for primary supers.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1936
  // Secondary supers are sought in the super_cache ('super_cache_addr').
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1937
  // (Secondary supers are interfaces and very deeply nested subtypes.)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1938
  // This works in the same check above because of a tricky aliasing
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1939
  // between the super_cache and the primary super display elements.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1940
  // (The 'super_check_addr' can address either, as the case requires.)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1941
  // Note that the cache is updated below if it does not help us find
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1942
  // what we need immediately.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1943
  // So if it was a primary super, we can just fail immediately.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1944
  // Otherwise, it's the slow path for us (no success at this point).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1945
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1946
#define FINAL_JUMP(label) if (&(label) != &L_fallthrough) { b(label); }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1947
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1948
  if (super_check_offset.is_register()) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1949
    beq(CCR0, *L_success);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1950
    cmpwi(CCR0, super_check_offset.as_register(), sc_offset);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1951
    if (L_failure == &L_fallthrough) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1952
      beq(CCR0, *L_slow_path);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1953
    } else {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1954
      bne(CCR0, *L_failure);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1955
      FINAL_JUMP(*L_slow_path);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1956
    }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1957
  } else {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1958
    if (super_check_offset.as_constant() == sc_offset) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1959
      // Need a slow path; fast failure is impossible.
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1960
      if (L_slow_path == &L_fallthrough) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1961
        beq(CCR0, *L_success);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1962
      } else {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1963
        bne(CCR0, *L_slow_path);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1964
        FINAL_JUMP(*L_success);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1965
      }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1966
    } else {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1967
      // No slow path; it's a fast decision.
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1968
      if (L_failure == &L_fallthrough) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1969
        beq(CCR0, *L_success);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1970
      } else {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1971
        bne(CCR0, *L_failure);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1972
        FINAL_JUMP(*L_success);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1973
      }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1974
    }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1975
  }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1976
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1977
  bind(L_fallthrough);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  1978
#undef FINAL_JUMP
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1979
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1980
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1981
void MacroAssembler::check_klass_subtype_slow_path(Register sub_klass,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1982
                                                   Register super_klass,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1983
                                                   Register temp1_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1984
                                                   Register temp2_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1985
                                                   Label* L_success,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1986
                                                   Register result_reg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1987
  const Register array_ptr = temp1_reg; // current value from cache array
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1988
  const Register temp      = temp2_reg;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1989
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1990
  assert_different_registers(sub_klass, super_klass, array_ptr, temp);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1991
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1992
  int source_offset = in_bytes(Klass::secondary_supers_offset());
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1993
  int target_offset = in_bytes(Klass::secondary_super_cache_offset());
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1994
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1995
  int length_offset = Array<Klass*>::length_offset_in_bytes();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1996
  int base_offset   = Array<Klass*>::base_offset_in_bytes();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1997
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1998
  Label hit, loop, failure, fallthru;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  1999
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2000
  ld(array_ptr, source_offset, sub_klass);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2001
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2002
  // TODO: PPC port: assert(4 == arrayOopDesc::length_length_in_bytes(), "precondition violated.");
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2003
  lwz(temp, length_offset, array_ptr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2004
  cmpwi(CCR0, temp, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2005
  beq(CCR0, result_reg!=noreg ? failure : fallthru); // length 0
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2006
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2007
  mtctr(temp); // load ctr
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2008
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2009
  bind(loop);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2010
  // Oops in table are NO MORE compressed.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2011
  ld(temp, base_offset, array_ptr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2012
  cmpd(CCR0, temp, super_klass);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2013
  beq(CCR0, hit);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2014
  addi(array_ptr, array_ptr, BytesPerWord);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2015
  bdnz(loop);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2016
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2017
  bind(failure);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2018
  if (result_reg!=noreg) li(result_reg, 1); // load non-zero result (indicates a miss)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2019
  b(fallthru);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2020
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2021
  bind(hit);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2022
  std(super_klass, target_offset, sub_klass); // save result to cache
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2023
  if (result_reg != noreg) { li(result_reg, 0); } // load zero result (indicates a hit)
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2024
  if (L_success != NULL) { b(*L_success); }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2025
  else if (result_reg == noreg) { blr(); } // return with CR0.eq if neither label nor result reg provided
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2026
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2027
  bind(fallthru);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2028
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2029
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2030
// Try fast path, then go to slow one if not successful
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2031
void MacroAssembler::check_klass_subtype(Register sub_klass,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2032
                         Register super_klass,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2033
                         Register temp1_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2034
                         Register temp2_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2035
                         Label& L_success) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2036
  Label L_failure;
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2037
  check_klass_subtype_fast_path(sub_klass, super_klass, temp1_reg, temp2_reg, &L_success, &L_failure);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2038
  check_klass_subtype_slow_path(sub_klass, super_klass, temp1_reg, temp2_reg, &L_success);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2039
  bind(L_failure); // Fallthru if not successful.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2040
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2041
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2042
void MacroAssembler::check_method_handle_type(Register mtype_reg, Register mh_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2043
                                              Register temp_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2044
                                              Label& wrong_method_type) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2045
  assert_different_registers(mtype_reg, mh_reg, temp_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2046
  // Compare method type against that of the receiver.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2047
  load_heap_oop_not_null(temp_reg, delayed_value(java_lang_invoke_MethodHandle::type_offset_in_bytes, temp_reg), mh_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2048
  cmpd(CCR0, temp_reg, mtype_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2049
  bne(CCR0, wrong_method_type);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2050
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2051
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2052
// Computes the byte offset of the stack slot (arg_slot + extra_slot_offset),
// with Interpreter::stackElementSize bytes per slot.
//
// For a constant arg_slot no code is emitted and the offset is returned as a
// constant. For a register arg_slot, code is emitted that leaves the offset
// in temp_reg (which therefore must be given), and temp_reg is returned.
RegisterOrConstant MacroAssembler::argument_offset(RegisterOrConstant arg_slot,
                                                   Register temp_reg,
                                                   int extra_slot_offset) {
  // cf. TemplateTable::prepare_invoke(), if (load_receiver).
  const int slot_bytes  = Interpreter::stackElementSize;
  const int extra_bytes = extra_slot_offset * slot_bytes;

  if (arg_slot.is_constant()) {
    // Everything is known at code generation time.
    const int total_bytes = static_cast<int>(extra_bytes + arg_slot.as_constant() * slot_bytes);
    return total_bytes;
  }

  assert(temp_reg != noreg, "must specify");
  // Scale the slot index by the slot size (shift by its log2) ...
  sldi(temp_reg, arg_slot.as_register(), exact_log2(slot_bytes));
  // ... and add the constant part, if there is one.
  if (extra_bytes != 0) {
    addi(temp_reg, temp_reg, extra_bytes);
  }
  return temp_reg;
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2069
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2070
// Emits the biased-locking fast path for locking the object in obj_reg.
//
// Parameters:
//   cr_reg     - condition register field used for the compares and for the
//                result of the CAS operations. The epoch check additionally
//                branches on CCR0 right after the record-form rldicl_, so
//                CCR0 is used independently of cr_reg.
//   obj_reg    - the object; its mark word is accessed at
//                oopDesc::mark_offset_in_bytes() (asserted to be 0 below).
//   mark_reg   - read as the mark word of the object without being loaded
//                here (presumably loaded by the caller; confirm at call
//                sites). It is overwritten on some paths: masked before the
//                first CAS and reloaded from the object after the revoke
//                attempt.
//   temp_reg,
//   temp2_reg  - scratch registers, both clobbered.
//   done       - target when the bias already belongs to R16_thread, or when
//                one of the two bias-acquiring CAS sequences completes
//                without bailing out.
//   slow_case  - failure target handed to the two bias-acquiring CAS
//                sequences; if NULL, done is used instead.
//
// Execution falls through at the end (cas_label) when the mark word does not
// carry the biased-lock pattern, and also after the bias-revocation attempt.
//
// Supports temp2_reg = R0.
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2071
void MacroAssembler::biased_locking_enter(ConditionRegister cr_reg, Register obj_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2072
                                          Register mark_reg, Register temp_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2073
                                          Register temp2_reg, Label& done, Label* slow_case) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2074
  assert(UseBiasedLocking, "why call this otherwise?");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2075
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2076
#ifdef ASSERT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2077
  assert_different_registers(obj_reg, mark_reg, temp_reg, temp2_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2078
#endif
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2079
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2080
  Label cas_label;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2081
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2082
  // Branch to done if fast path fails and no slow_case provided.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2083
  Label *slow_case_int = (slow_case != NULL) ? slow_case : &done;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2084
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2085
  // Biased locking
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2086
  // See whether the lock is currently biased toward our thread and
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2087
  // whether the epoch is still valid
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2088
  // Note that the runtime guarantees sufficient alignment of JavaThread
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2089
  // pointers to allow age to be placed into low bits
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2090
  assert(markOopDesc::age_shift == markOopDesc::lock_bits + markOopDesc::biased_lock_bits,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2091
         "biased locking makes assumptions about bit layout");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2092
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2093
  // Statistics only: count every pass through this code with a plain
  // word-sized load / increment / store on the total entry counter.
  if (PrintBiasedLockingStatistics) {
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2094
    load_const(temp2_reg, (address) BiasedLocking::total_entry_count_addr(), temp_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2095
    lwzx(temp_reg, temp2_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2096
    addi(temp_reg, temp_reg, 1);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2097
    stwx(temp_reg, temp2_reg);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2098
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2099
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2100
  // A mark word without the biased-lock pattern skips everything up to
  // cas_label at the end of this function.
  andi(temp_reg, mark_reg, markOopDesc::biased_lock_mask_in_place);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2101
  cmpwi(cr_reg, temp_reg, markOopDesc::biased_lock_pattern);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2102
  bne(cr_reg, cas_label);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2103
23492
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  2104
  // temp_reg = ((klass prototype header | R16_thread) ^ mark_reg) & ~age_mask.
  // A zero result means the mark word differs from the expected biased header
  // in nothing but the age bits. temp_reg is inspected again further below.
  load_klass(temp_reg, obj_reg);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2105
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2106
  load_const_optimized(temp2_reg, ~((int) markOopDesc::age_mask_in_place));
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2107
  ld(temp_reg, in_bytes(Klass::prototype_header_offset()), temp_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2108
  orr(temp_reg, R16_thread, temp_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2109
  xorr(temp_reg, mark_reg, temp_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2110
  andr(temp_reg, temp_reg, temp2_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2111
  cmpdi(cr_reg, temp_reg, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2112
  // Statistics only. temp_reg still holds the xor result that is examined
  // after this block, so mark_reg is borrowed as the counter scratch and
  // reloaded from the object afterwards. cr_reg is tested again by the beq
  // that follows the block.
  if (PrintBiasedLockingStatistics) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2113
    Label l;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2114
    bne(cr_reg, l);
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2115
    load_const(temp2_reg, (address) BiasedLocking::biased_lock_entry_count_addr());
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2116
    lwzx(mark_reg, temp2_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2117
    addi(mark_reg, mark_reg, 1);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2118
    stwx(mark_reg, temp2_reg);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2119
    // restore mark_reg
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2120
    ld(mark_reg, oopDesc::mark_offset_in_bytes(), obj_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2121
    bind(l);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2122
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2123
  beq(cr_reg, done);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2124
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2125
  Label try_revoke_bias;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2126
  Label try_rebias;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2127
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2128
  // At this point we know that the header has the bias pattern and
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2129
  // that we are not the bias owner in the current epoch. We need to
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2130
  // figure out more details about the state of the header in order to
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2131
  // know what operations can be legally performed on the object's
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2132
  // header.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2133
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2134
  // If the low three bits in the xor result aren't clear, that means
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2135
  // the prototype header is no longer biased and we have to revoke
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2136
  // the bias on this object.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2137
  andi(temp2_reg, temp_reg, markOopDesc::biased_lock_mask_in_place);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2138
  cmpwi(cr_reg, temp2_reg, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2139
  bne(cr_reg, try_revoke_bias);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2140
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2141
  // Biasing is still enabled for this data type. See whether the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2142
  // epoch of the current bias is still valid, meaning that the epoch
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2143
  // bits of the mark word are equal to the epoch bits of the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2144
  // prototype header. (Note that the prototype header's epoch bits
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2145
  // only change at a safepoint.) If not, attempt to rebias the object
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2146
  // toward the current thread. Note that we must be absolutely sure
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2147
  // that the current epoch is invalid in order to do this because
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2148
  // otherwise the manipulations it performs on the mark word are
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2149
  // illegal.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2150
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2151
  int shift_amount = 64 - markOopDesc::epoch_shift;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2152
  // rotate epoch bits to right (little) end and set other bits to 0
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2153
  // [ big part | epoch | little part ] -> [ 0..0 | epoch ]
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2154
  rldicl_(temp2_reg, temp_reg, shift_amount, 64 - markOopDesc::epoch_bits);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2155
  // branch if epoch bits are != 0, i.e. they differ, because the epoch has been incremented
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2156
  bne(CCR0, try_rebias);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2157
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2158
  // The epoch of the current bias is still valid but we know nothing
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2159
  // about the owner; it might be set or it might be clear. Try to
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2160
  // acquire the bias of the object using an atomic operation. If this
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2161
  // fails we will go in to the runtime to revoke the object's bias.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2162
  // Note that we first construct the presumed unbiased header so we
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2163
  // don't accidentally blow away another thread's valid bias.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2164
  andi(mark_reg, mark_reg, (markOopDesc::biased_lock_mask_in_place |
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2165
                                markOopDesc::age_mask_in_place |
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2166
                                markOopDesc::epoch_mask_in_place));
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2167
  orr(temp_reg, R16_thread, mark_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2168
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2169
  assert(oopDesc::mark_offset_in_bytes() == 0, "offset of _mark is not 0");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2170
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2171
  // CmpxchgX sets cr_reg to cmpX(temp2_reg, mark_reg).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2172
  cmpxchgd(/*flag=*/cr_reg, /*current_value=*/temp2_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2173
           /*compare_value=*/mark_reg, /*exchange_value=*/temp_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2174
           /*where=*/obj_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2175
           MacroAssembler::MemBarAcq,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2176
           MacroAssembler::cmpxchgx_hint_acquire_lock(),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2177
           noreg, slow_case_int); // bail out if failed
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2178
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2179
  // If the biasing toward our thread failed, this means that
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2180
  // another thread succeeded in biasing it toward itself and we
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2181
  // need to revoke that bias. The revocation will occur in the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2182
  // interpreter runtime in the slow case.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2183
  if (PrintBiasedLockingStatistics) {
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2184
    load_const(temp2_reg, (address) BiasedLocking::anonymously_biased_lock_entry_count_addr(), temp_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2185
    lwzx(temp_reg, temp2_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2186
    addi(temp_reg, temp_reg, 1);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2187
    stwx(temp_reg, temp2_reg);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2188
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2189
  b(done);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2190
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2191
  bind(try_rebias);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2192
  // At this point we know the epoch has expired, meaning that the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2193
  // current "bias owner", if any, is actually invalid. Under these
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2194
  // circumstances _only_, we are allowed to use the current header's
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2195
  // value as the comparison value when doing the cas to acquire the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2196
  // bias in the current epoch. In other words, we allow transfer of
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2197
  // the bias from one thread to another directly in this situation.
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2198
  // New mark word in temp_reg: klass prototype header | R16_thread | age
  // bits of the current mark word.
  load_klass(temp_reg, obj_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2199
  andi(temp2_reg, mark_reg, markOopDesc::age_mask_in_place);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2200
  orr(temp2_reg, R16_thread, temp2_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2201
  ld(temp_reg, in_bytes(Klass::prototype_header_offset()), temp_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2202
  orr(temp_reg, temp2_reg, temp_reg);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2203
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2204
  assert(oopDesc::mark_offset_in_bytes() == 0, "offset of _mark is not 0");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2205
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2206
  cmpxchgd(/*flag=*/cr_reg, /*current_value=*/temp2_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2207
                 /*compare_value=*/mark_reg, /*exchange_value=*/temp_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2208
                 /*where=*/obj_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2209
                 MacroAssembler::MemBarAcq,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2210
                 MacroAssembler::cmpxchgx_hint_acquire_lock(),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2211
                 noreg, slow_case_int); // bail out if failed
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2212
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2213
  // If the biasing toward our thread failed, this means that
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2214
  // another thread succeeded in biasing it toward itself and we
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2215
  // need to revoke that bias. The revocation will occur in the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2216
  // interpreter runtime in the slow case.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2217
  if (PrintBiasedLockingStatistics) {
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2218
    load_const(temp2_reg, (address) BiasedLocking::rebiased_lock_entry_count_addr(), temp_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2219
    lwzx(temp_reg, temp2_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2220
    addi(temp_reg, temp_reg, 1);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2221
    stwx(temp_reg, temp2_reg);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2222
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2223
  b(done);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2224
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2225
  bind(try_revoke_bias);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2226
  // The prototype mark in the klass doesn't have the bias bit set any
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2227
  // more, indicating that objects of this data type are not supposed
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2228
  // to be biased any more. We are going to try to reset the mark of
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2229
  // this object to the prototype value and fall through to the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2230
  // CAS-based locking scheme. Note that if our CAS fails, it means
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2231
  // that another thread raced us for the privilege of revoking the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2232
  // bias of this particular object, so it's okay to continue in the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2233
  // normal locking code.
23492
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  2234
  load_klass(temp_reg, obj_reg);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2235
  ld(temp_reg, in_bytes(Klass::prototype_header_offset()), temp_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2236
  andi(temp2_reg, mark_reg, markOopDesc::age_mask_in_place);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2237
  orr(temp_reg, temp_reg, temp2_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2238
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2239
  assert(oopDesc::mark_offset_in_bytes() == 0, "offset of _mark is not 0");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2240
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2241
  // CmpxchgX sets cr_reg to cmpX(temp2_reg, mark_reg).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2242
  // Unlike the two CAS sequences above, no failure label is passed here:
  // execution continues below whether or not the exchange happened.
  cmpxchgd(/*flag=*/cr_reg, /*current_value=*/temp2_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2243
                 /*compare_value=*/mark_reg, /*exchange_value=*/temp_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2244
                 /*where=*/obj_reg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2245
                 MacroAssembler::MemBarAcq,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2246
                 MacroAssembler::cmpxchgx_hint_acquire_lock());
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2247
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2248
  // reload markOop in mark_reg before continuing with lightweight locking
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2249
  ld(mark_reg, oopDesc::mark_offset_in_bytes(), obj_reg);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2250
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2251
  // Fall through to the normal CAS-based lock, because no matter what
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2252
  // the result of the above CAS, some thread must have succeeded in
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2253
  // removing the bias bit from the object's header.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2254
  if (PrintBiasedLockingStatistics) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2255
    Label l;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2256
    bne(cr_reg, l);
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2257
    load_const(temp2_reg, (address) BiasedLocking::revoked_lock_entry_count_addr(), temp_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2258
    lwzx(temp_reg, temp2_reg);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2259
    addi(temp_reg, temp_reg, 1);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2260
    stwx(temp_reg, temp2_reg);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2261
    bind(l);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2262
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2263
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2264
  bind(cas_label);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2265
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2266
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2267
// Emits the biased-locking check for monitor exit. The doubleword at offset 0
// from mark_addr is loaded, masked with biased_lock_mask_in_place and compared
// against biased_lock_pattern; on a match the code branches to done. Otherwise
// execution falls through past the end of this sequence.
//   cr_reg    - condition register field that receives the compare result.
//   mark_addr - address the mark word is loaded from.
//   temp_reg  - scratch; left holding the masked mark word bits.
//   done      - branch target when the mark word carries the bias pattern.
void MacroAssembler::biased_locking_exit (ConditionRegister cr_reg, Register mark_addr, Register temp_reg, Label& done) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2268
  // Check for biased locking unlock case, which is a no-op
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2269
  // Note: we do not have to check the thread ID for two reasons.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2270
  // First, the interpreter checks for IllegalMonitorStateException at
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2271
  // a higher level. Second, if the bias was revoked while we held the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2272
  // lock, the object could not be rebiased toward another thread, so
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2273
  // the bias bit would be clear.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2274
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2275
  ld(temp_reg, 0, mark_addr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2276
  andi(temp_reg, temp_reg, markOopDesc::biased_lock_mask_in_place);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2277
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2278
  cmpwi(cr_reg, temp_reg, markOopDesc::biased_lock_pattern);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2279
  beq(cr_reg, done);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2280
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2281
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2282
// allocation (for C1)
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2283
void MacroAssembler::eden_allocate(
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2284
  Register obj,                      // result: pointer to object after successful allocation
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2285
  Register var_size_in_bytes,        // object size in bytes if unknown at compile time; invalid otherwise
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2286
  int      con_size_in_bytes,        // object size in bytes if   known at compile time
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2287
  Register t1,                       // temp register
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2288
  Register t2,                       // temp register
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2289
  Label&   slow_case                 // continuation point if fast allocation fails
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2290
) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2291
  b(slow_case);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2292
}
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2293
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2294
void MacroAssembler::tlab_allocate(
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2295
  Register obj,                      // result: pointer to object after successful allocation
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2296
  Register var_size_in_bytes,        // object size in bytes if unknown at compile time; invalid otherwise
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2297
  int      con_size_in_bytes,        // object size in bytes if   known at compile time
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2298
  Register t1,                       // temp register
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2299
  Label&   slow_case                 // continuation point if fast allocation fails
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2300
) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2301
  // make sure arguments make sense
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2302
  assert_different_registers(obj, var_size_in_bytes, t1);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2303
  assert(0 <= con_size_in_bytes && is_simm13(con_size_in_bytes), "illegal object size");
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2304
  assert((con_size_in_bytes & MinObjAlignmentInBytesMask) == 0, "object size is not multiple of alignment");
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2305
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2306
  const Register new_top = t1;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2307
  //verify_tlab(); not implemented
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2308
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2309
  ld(obj, in_bytes(JavaThread::tlab_top_offset()), R16_thread);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2310
  ld(R0, in_bytes(JavaThread::tlab_end_offset()), R16_thread);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2311
  if (var_size_in_bytes == noreg) {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2312
    addi(new_top, obj, con_size_in_bytes);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2313
  } else {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2314
    add(new_top, obj, var_size_in_bytes);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2315
  }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2316
  cmpld(CCR0, new_top, R0);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2317
  bc_far_optimized(Assembler::bcondCRbiIs1, bi0(CCR0, Assembler::greater), slow_case);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2318
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2319
#ifdef ASSERT
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2320
  // make sure new free pointer is properly aligned
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2321
  {
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2322
    Label L;
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2323
    andi_(R0, new_top, MinObjAlignmentInBytesMask);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2324
    beq(CCR0, L);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2325
    stop("updated TLAB free is not properly aligned", 0x934);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2326
    bind(L);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2327
  }
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2328
#endif // ASSERT
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2329
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2330
  // update the tlab top pointer
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2331
  std(new_top, in_bytes(JavaThread::tlab_top_offset()), R16_thread);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2332
  //verify_tlab(); not implemented
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2333
}
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2334
// TLAB refill is not provided by this assembler: calling this function
// reports unimplemented("tlab_refill"). The label arguments are unused.
void MacroAssembler::tlab_refill(Label& retry_tlab,
                                 Label& try_eden,
                                 Label& slow_case) {
  unimplemented("tlab_refill");
}
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2337
// Allocated-bytes accounting is not provided by this assembler: calling this
// function reports unimplemented("incr_allocated_bytes"). All arguments are unused.
void MacroAssembler::incr_allocated_bytes(RegisterOrConstant size_in_bytes,
                                          Register t1,
                                          Register t2) {
  unimplemented("incr_allocated_bytes");
}
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2340
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2341
// Emits a call trampoline stub and returns the address handed out by
// start_a_stub(), or NULL if no stub space could be obtained.
//
// The stub loads the call target from the constant pool slot at
// destination_toc_offset (relative to Rtoc, or to the method TOC address
// computed here when Rtoc == noreg), moves it to CTR and branches there.
// A trampoline_stub relocation links the stub to the call instruction at
// insts_call_instruction_offset within the instructions section.
address MacroAssembler::emit_trampoline_stub(int destination_toc_offset,
                                             int insts_call_instruction_offset, Register Rtoc) {
  // Open the stub; give up when the CodeCache is full.
  address stub = start_a_stub(64);
  if (stub == NULL) {
    return NULL;
  }

  // Relate this trampoline stub to its call instruction, which lives at
  // insts_call_instruction_offset in the instructions code-section.
  address call_pc = code()->insts()->start() + insts_call_instruction_offset;
  relocate(trampoline_stub_Relocation::spec(call_pc));
  const int code_begin_offset = offset();

  // java_to_interp stubs use R11_scratch1 as scratch register while call
  // trampoline stubs use R12_scratch2; that difference is what lets
  // is_NativeCallTrampolineStub_at() tell them apart.
  Register scratch = R12_scratch2;

  // Stub code:
  // - load the TOC (only if the caller did not supply one)
  // - load the call target from the constant pool
  // - call
  if (Rtoc == noreg) {
    calculate_address_from_global_toc(scratch, method_toc());
    Rtoc = scratch;
  }

  ld_largeoffset_unchecked(scratch, destination_toc_offset, Rtoc, false);
  mtctr(scratch);
  bctr();

  const address code_begin = addr_at(code_begin_offset);

  // The encoded destination_toc_offset must be recoverable from the stub and must match.
  assert(destination_toc_offset == NativeCallTrampolineStub_at(code_begin)->destination_toc_offset(),
         "encoded offset into the constant pool must match");
  // The emitted code must fit into trampoline_stub_size.
  assert((uint)(offset() - code_begin_offset) <= trampoline_stub_size, "should be good size");
  assert(is_NativeCallTrampolineStub_at(code_begin), "doesn't look like a trampoline");

  // Close the stub.
  end_a_stub();
  return stub;
}
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2384
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2385
// TM on PPC64.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2386
// Emits a ldarx/stdcx_ retry loop that adds simm16 to the value at addr.
// result is used as the working register and ends up holding the value
// that was stored. CCR0 is set by the store-conditional.
void MacroAssembler::atomic_inc_ptr(Register addr, Register result, int simm16) {
  Label again;

  bind(again);
  ldarx(result, addr, /*hint*/ false);  // load and reserve
  addi(result, result, simm16);         // apply the increment
  stdcx_(result, addr);                 // store if the reservation still holds

  // stXcx_ sets CCR0; loop until the conditional store succeeded.
  if (UseStaticBranchPredictionInCompareAndSwapPPC64) {
    bne_predict_not_taken(CCR0, again);
  } else {
    bne(CCR0, again);
  }
}
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2398
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2399
// Emits a lwarx/stwcx_ retry loop that ORs uimm16 into the value at addr.
// result is used as the working register and ends up holding the value
// that was stored. CCR0 is set by the store-conditional.
void MacroAssembler::atomic_ori_int(Register addr, Register result, int uimm16) {
  Label again;

  bind(again);
  lwarx(result, addr, /*hint*/ false);  // load and reserve
  ori(result, result, uimm16);          // set the requested bits
  stwcx_(result, addr);                 // store if the reservation still holds

  // stXcx_ sets CCR0; loop until the conditional store succeeded.
  if (UseStaticBranchPredictionInCompareAndSwapPPC64) {
    bne_predict_not_taken(CCR0, again);
  } else {
    bne(CCR0, again);
  }
}
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2411
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2412
#if INCLUDE_RTM_OPT
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2413
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2414
// Update rtm_counters based on abort status
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2415
// input: abort_status
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2416
//        rtm_counters (RTMLockingCounters*)
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2417
void MacroAssembler::rtm_counters_update(Register abort_status, Register rtm_counters_Reg) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2418
  // Mapping to keep PreciseRTMLockingStatistics similar to x86.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2419
  // x86 ppc (! means inverted, ? means not the same)
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2420
  //  0   31  Set if abort caused by XABORT instruction.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2421
  //  1  ! 7  If set, the transaction may succeed on a retry. This bit is always clear if bit 0 is set.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2422
  //  2   13  Set if another logical processor conflicted with a memory address that was part of the transaction that aborted.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2423
  //  3   10  Set if an internal buffer overflowed.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2424
  //  4  ?12  Set if a debug breakpoint was hit.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2425
  //  5  ?32  Set if an abort occurred during execution of a nested transaction.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2426
  const  int tm_failure_bit[] = {Assembler::tm_tabort, // Note: Seems like signal handler sets this, too.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2427
                                 Assembler::tm_failure_persistent, // inverted: transient
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2428
                                 Assembler::tm_trans_cf,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2429
                                 Assembler::tm_footprint_of,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2430
                                 Assembler::tm_non_trans_cf,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2431
                                 Assembler::tm_suspended};
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2432
  const bool tm_failure_inv[] = {false, true, false, false, false, false};
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2433
  assert(sizeof(tm_failure_bit)/sizeof(int) == RTMLockingCounters::ABORT_STATUS_LIMIT, "adapt mapping!");
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2434
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2435
  const Register addr_Reg = R0;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2436
  // Keep track of offset to where rtm_counters_Reg had pointed to.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2437
  int counters_offs = RTMLockingCounters::abort_count_offset();
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2438
  addi(addr_Reg, rtm_counters_Reg, counters_offs);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2439
  const Register temp_Reg = rtm_counters_Reg;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2440
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2441
  //atomic_inc_ptr(addr_Reg, temp_Reg); We don't increment atomically
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2442
  ldx(temp_Reg, addr_Reg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2443
  addi(temp_Reg, temp_Reg, 1);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2444
  stdx(temp_Reg, addr_Reg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2445
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2446
  if (PrintPreciseRTMLockingStatistics) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2447
    int counters_offs_delta = RTMLockingCounters::abortX_count_offset() - counters_offs;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2448
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2449
    //mftexasr(abort_status); done by caller
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2450
    for (int i = 0; i < RTMLockingCounters::ABORT_STATUS_LIMIT; i++) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2451
      counters_offs += counters_offs_delta;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2452
      li(temp_Reg, counters_offs_delta); // can't use addi with R0
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2453
      add(addr_Reg, addr_Reg, temp_Reg); // point to next counter
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2454
      counters_offs_delta = sizeof(uintx);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2455
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2456
      Label check_abort;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2457
      rldicr_(temp_Reg, abort_status, tm_failure_bit[i], 0);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2458
      if (tm_failure_inv[i]) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2459
        bne(CCR0, check_abort);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2460
      } else {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2461
        beq(CCR0, check_abort);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2462
      }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2463
      //atomic_inc_ptr(addr_Reg, temp_Reg); We don't increment atomically
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2464
      ldx(temp_Reg, addr_Reg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2465
      addi(temp_Reg, temp_Reg, 1);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2466
      stdx(temp_Reg, addr_Reg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2467
      bind(check_abort);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2468
    }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2469
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2470
  li(temp_Reg, -counters_offs); // can't use addi with R0
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2471
  add(rtm_counters_Reg, addr_Reg, temp_Reg); // restore
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2472
}
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2473
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2474
// Branch if (random & (count-1) != 0), count is 2^n
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2475
// tmp and CR0 are killed
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2476
void MacroAssembler::branch_on_random_using_tb(Register tmp, int count, Label& brLabel) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2477
  mftb(tmp);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2478
  andi_(tmp, tmp, count-1);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2479
  bne(CCR0, brLabel);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2480
}
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2481
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2482
// Perform abort ratio calculation, set no_rtm bit if high ratio.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2483
// input:  rtm_counters_Reg (RTMLockingCounters* address) - KILLED
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2484
void MacroAssembler::rtm_abort_ratio_calculation(Register rtm_counters_Reg,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2485
                                                 RTMLockingCounters* rtm_counters,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2486
                                                 Metadata* method_data) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2487
  Label L_done, L_check_always_rtm1, L_check_always_rtm2;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2488
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2489
  if (RTMLockingCalculationDelay > 0) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2490
    // Delay calculation.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2491
    ld(rtm_counters_Reg, (RegisterOrConstant)(intptr_t)RTMLockingCounters::rtm_calculation_flag_addr());
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2492
    cmpdi(CCR0, rtm_counters_Reg, 0);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2493
    beq(CCR0, L_done);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2494
    load_const_optimized(rtm_counters_Reg, (address)rtm_counters, R0); // reload
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2495
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2496
  // Abort ratio calculation only if abort_count > RTMAbortThreshold.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2497
  //   Aborted transactions = abort_count * 100
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2498
  //   All transactions = total_count *  RTMTotalCountIncrRate
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2499
  //   Set no_rtm bit if (Aborted transactions >= All transactions * RTMAbortRatio)
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2500
  ld(R0, RTMLockingCounters::abort_count_offset(), rtm_counters_Reg);
46494
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2501
  if (is_simm(RTMAbortThreshold, 16)) {   // cmpdi can handle 16bit immediate only.
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2502
    cmpdi(CCR0, R0, RTMAbortThreshold);
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2503
    blt(CCR0, L_check_always_rtm2);  // reload of rtm_counters_Reg not necessary
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2504
  } else {
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2505
    load_const_optimized(rtm_counters_Reg, RTMAbortThreshold);
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2506
    cmpd(CCR0, R0, rtm_counters_Reg);
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2507
    blt(CCR0, L_check_always_rtm1);  // reload of rtm_counters_Reg required
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2508
  }
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2509
  mulli(R0, R0, 100);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2510
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2511
  const Register tmpReg = rtm_counters_Reg;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2512
  ld(tmpReg, RTMLockingCounters::total_count_offset(), rtm_counters_Reg);
46494
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2513
  mulli(tmpReg, tmpReg, RTMTotalCountIncrRate); // allowable range: int16
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2514
  mulli(tmpReg, tmpReg, RTMAbortRatio);         // allowable range: int16
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2515
  cmpd(CCR0, R0, tmpReg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2516
  blt(CCR0, L_check_always_rtm1); // jump to reload
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2517
  if (method_data != NULL) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2518
    // Set rtm_state to "no rtm" in MDO.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2519
    // Not using a metadata relocation. Method and Class Loader are kept alive anyway.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2520
    // (See nmethod::metadata_do and CodeBuffer::finalize_oop_references.)
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2521
    load_const(R0, (address)method_data + MethodData::rtm_state_offset_in_bytes(), tmpReg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2522
    atomic_ori_int(R0, tmpReg, NoRTM);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2523
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2524
  b(L_done);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2525
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2526
  bind(L_check_always_rtm1);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2527
  load_const_optimized(rtm_counters_Reg, (address)rtm_counters, R0); // reload
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2528
  bind(L_check_always_rtm2);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2529
  ld(tmpReg, RTMLockingCounters::total_count_offset(), rtm_counters_Reg);
46494
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2530
  int64_t thresholdValue = RTMLockingThreshold / RTMTotalCountIncrRate;
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2531
  if (is_simm(thresholdValue, 16)) {   // cmpdi can handle 16bit immediate only.
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2532
    cmpdi(CCR0, tmpReg, thresholdValue);
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2533
  } else {
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2534
    load_const_optimized(R0, thresholdValue);
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2535
    cmpd(CCR0, tmpReg, R0);
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2536
  }
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2537
  blt(CCR0, L_done);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2538
  if (method_data != NULL) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2539
    // Set rtm_state to "always rtm" in MDO.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2540
    // Not using a metadata relocation. See above.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2541
    load_const(R0, (address)method_data + MethodData::rtm_state_offset_in_bytes(), tmpReg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2542
    atomic_ori_int(R0, tmpReg, UseRTM);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2543
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2544
  bind(L_done);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2545
}
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2546
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2547
// Update counters and perform abort ratio calculation.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2548
// input: abort_status_Reg
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2549
void MacroAssembler::rtm_profiling(Register abort_status_Reg, Register temp_Reg,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2550
                                   RTMLockingCounters* rtm_counters,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2551
                                   Metadata* method_data,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2552
                                   bool profile_rtm) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2553
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2554
  assert(rtm_counters != NULL, "should not be NULL when profiling RTM");
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2555
  // Update rtm counters based on state at abort.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2556
  // Reads abort_status_Reg, updates flags.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2557
  assert_different_registers(abort_status_Reg, temp_Reg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2558
  load_const_optimized(temp_Reg, (address)rtm_counters, R0);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2559
  rtm_counters_update(abort_status_Reg, temp_Reg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2560
  if (profile_rtm) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2561
    assert(rtm_counters != NULL, "should not be NULL when profiling RTM");
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2562
    rtm_abort_ratio_calculation(temp_Reg, rtm_counters, method_data);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2563
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2564
}
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2565
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2566
// Retry on abort if abort's status indicates non-persistent failure.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2567
// inputs: retry_count_Reg
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2568
//       : abort_status_Reg
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2569
// output: retry_count_Reg decremented by 1
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2570
void MacroAssembler::rtm_retry_lock_on_abort(Register retry_count_Reg, Register abort_status_Reg,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2571
                                             Label& retryLabel, Label* checkRetry) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2572
  Label doneRetry;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2573
  rldicr_(R0, abort_status_Reg, tm_failure_persistent, 0);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2574
  bne(CCR0, doneRetry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2575
  if (checkRetry) { bind(*checkRetry); }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2576
  addic_(retry_count_Reg, retry_count_Reg, -1);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2577
  blt(CCR0, doneRetry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2578
  smt_yield(); // Can't use wait(). No permission (SIGILL).
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2579
  b(retryLabel);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2580
  bind(doneRetry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2581
}
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2582
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2583
// Spin and retry if lock is busy.
43428
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2584
// inputs: owner_addr_Reg (monitor address)
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2585
//       : retry_count_Reg
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2586
// output: retry_count_Reg decremented by 1
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2587
// CTR is killed
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2588
void MacroAssembler::rtm_retry_lock_on_busy(Register retry_count_Reg, Register owner_addr_Reg, Label& retryLabel) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2589
  Label SpinLoop, doneRetry;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2590
  addic_(retry_count_Reg, retry_count_Reg, -1);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2591
  blt(CCR0, doneRetry);
43428
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2592
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2593
  if (RTMSpinLoopCount > 1) {
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2594
    li(R0, RTMSpinLoopCount);
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2595
    mtctr(R0);
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2596
  }
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2597
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2598
  bind(SpinLoop);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2599
  smt_yield(); // Can't use waitrsv(). No permission (SIGILL).
43428
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2600
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2601
  if (RTMSpinLoopCount > 1) {
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2602
    bdz(retryLabel);
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2603
    ld(R0, 0, owner_addr_Reg);
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2604
    cmpdi(CCR0, R0, 0);
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2605
    bne(CCR0, SpinLoop);
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2606
  }
3dccc891c216 8171266: PPC64: Add support to -XX:RTMSpinLoopCount=0
gromero
parents: 42661
diff changeset
  2607
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2608
  b(retryLabel);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2609
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2610
  bind(doneRetry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2611
}
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2612
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2613
// Use RTM for normal stack locks.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2614
// Input: objReg (object to lock)
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2615
void MacroAssembler::rtm_stack_locking(ConditionRegister flag,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2616
                                       Register obj, Register mark_word, Register tmp,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2617
                                       Register retry_on_abort_count_Reg,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2618
                                       RTMLockingCounters* stack_rtm_counters,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2619
                                       Metadata* method_data, bool profile_rtm,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2620
                                       Label& DONE_LABEL, Label& IsInflated) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2621
  assert(UseRTMForStackLocks, "why call this otherwise?");
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2622
  assert(!UseBiasedLocking, "Biased locking is not supported with RTM locking");
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2623
  Label L_rtm_retry, L_decrement_retry, L_on_abort;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2624
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2625
  if (RTMRetryCount > 0) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2626
    load_const_optimized(retry_on_abort_count_Reg, RTMRetryCount); // Retry on abort
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2627
    bind(L_rtm_retry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2628
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2629
  andi_(R0, mark_word, markOopDesc::monitor_value);  // inflated vs stack-locked|neutral|biased
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2630
  bne(CCR0, IsInflated);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2631
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2632
  if (PrintPreciseRTMLockingStatistics || profile_rtm) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2633
    Label L_noincrement;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2634
    if (RTMTotalCountIncrRate > 1) {
46494
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2635
      branch_on_random_using_tb(tmp, RTMTotalCountIncrRate, L_noincrement);
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2636
    }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2637
    assert(stack_rtm_counters != NULL, "should not be NULL when profiling RTM");
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2638
    load_const_optimized(tmp, (address)stack_rtm_counters->total_count_addr(), R0);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2639
    //atomic_inc_ptr(tmp, /*temp, will be reloaded*/mark_word); We don't increment atomically
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2640
    ldx(mark_word, tmp);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2641
    addi(mark_word, mark_word, 1);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2642
    stdx(mark_word, tmp);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2643
    bind(L_noincrement);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2644
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2645
  tbegin_();
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2646
  beq(CCR0, L_on_abort);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2647
  ld(mark_word, oopDesc::mark_offset_in_bytes(), obj);         // Reload in transaction, conflicts need to be tracked.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2648
  andi(R0, mark_word, markOopDesc::biased_lock_mask_in_place); // look at 3 lock bits
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2649
  cmpwi(flag, R0, markOopDesc::unlocked_value);                // bits = 001 unlocked
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2650
  beq(flag, DONE_LABEL);                                       // all done if unlocked
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2651
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2652
  if (UseRTMXendForLockBusy) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2653
    tend_();
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2654
    b(L_decrement_retry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2655
  } else {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2656
    tabort_();
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2657
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2658
  bind(L_on_abort);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2659
  const Register abort_status_Reg = tmp;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2660
  mftexasr(abort_status_Reg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2661
  if (PrintPreciseRTMLockingStatistics || profile_rtm) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2662
    rtm_profiling(abort_status_Reg, /*temp*/mark_word, stack_rtm_counters, method_data, profile_rtm);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2663
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2664
  ld(mark_word, oopDesc::mark_offset_in_bytes(), obj); // reload
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2665
  if (RTMRetryCount > 0) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2666
    // Retry on lock abort if abort status is not permanent.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2667
    rtm_retry_lock_on_abort(retry_on_abort_count_Reg, abort_status_Reg, L_rtm_retry, &L_decrement_retry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2668
  } else {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2669
    bind(L_decrement_retry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2670
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2671
}
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2672
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2673
// Use RTM for inflating locks
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2674
// inputs: obj       (object to lock)
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2675
//         mark_word (current header - KILLED)
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2676
//         boxReg    (on-stack box address (displaced header location) - KILLED)
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2677
void MacroAssembler::rtm_inflated_locking(ConditionRegister flag,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2678
                                          Register obj, Register mark_word, Register boxReg,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2679
                                          Register retry_on_busy_count_Reg, Register retry_on_abort_count_Reg,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2680
                                          RTMLockingCounters* rtm_counters,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2681
                                          Metadata* method_data, bool profile_rtm,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2682
                                          Label& DONE_LABEL) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2683
  assert(UseRTMLocking, "why call this otherwise?");
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2684
  Label L_rtm_retry, L_decrement_retry, L_on_abort;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2685
  // Clean monitor_value bit to get valid pointer.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2686
  int owner_offset = ObjectMonitor::owner_offset_in_bytes() - markOopDesc::monitor_value;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2687
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2688
  // Store non-null, using boxReg instead of (intptr_t)markOopDesc::unused_mark().
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2689
  std(boxReg, BasicLock::displaced_header_offset_in_bytes(), boxReg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2690
  const Register tmpReg = boxReg;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2691
  const Register owner_addr_Reg = mark_word;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2692
  addi(owner_addr_Reg, mark_word, owner_offset);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2693
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2694
  if (RTMRetryCount > 0) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2695
    load_const_optimized(retry_on_busy_count_Reg, RTMRetryCount);  // Retry on lock busy.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2696
    load_const_optimized(retry_on_abort_count_Reg, RTMRetryCount); // Retry on abort.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2697
    bind(L_rtm_retry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2698
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2699
  if (PrintPreciseRTMLockingStatistics || profile_rtm) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2700
    Label L_noincrement;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2701
    if (RTMTotalCountIncrRate > 1) {
46494
3fdd343bc5ea 8180612: [ppc] assert failure in cpu/ppc/vm/assembler_ppc.hpp due to immediate value out of range
lucy
parents: 46369
diff changeset
  2702
      branch_on_random_using_tb(R0, RTMTotalCountIncrRate, L_noincrement);
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2703
    }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2704
    assert(rtm_counters != NULL, "should not be NULL when profiling RTM");
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2705
    load_const(R0, (address)rtm_counters->total_count_addr(), tmpReg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2706
    //atomic_inc_ptr(R0, tmpReg); We don't increment atomically
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2707
    ldx(tmpReg, R0);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2708
    addi(tmpReg, tmpReg, 1);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2709
    stdx(tmpReg, R0);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2710
    bind(L_noincrement);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2711
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2712
  tbegin_();
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2713
  beq(CCR0, L_on_abort);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2714
  // We don't reload mark word. Will only be reset at safepoint.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2715
  ld(R0, 0, owner_addr_Reg); // Load in transaction, conflicts need to be tracked.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2716
  cmpdi(flag, R0, 0);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2717
  beq(flag, DONE_LABEL);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2718
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2719
  if (UseRTMXendForLockBusy) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2720
    tend_();
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2721
    b(L_decrement_retry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2722
  } else {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2723
    tabort_();
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2724
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2725
  bind(L_on_abort);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2726
  const Register abort_status_Reg = tmpReg;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2727
  mftexasr(abort_status_Reg);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2728
  if (PrintPreciseRTMLockingStatistics || profile_rtm) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2729
    rtm_profiling(abort_status_Reg, /*temp*/ owner_addr_Reg, rtm_counters, method_data, profile_rtm);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2730
    // Restore owner_addr_Reg
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2731
    ld(mark_word, oopDesc::mark_offset_in_bytes(), obj);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2732
#ifdef ASSERT
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2733
    andi_(R0, mark_word, markOopDesc::monitor_value);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2734
    asm_assert_ne("must be inflated", 0xa754); // Deflating only allowed at safepoint.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2735
#endif
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2736
    addi(owner_addr_Reg, mark_word, owner_offset);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2737
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2738
  if (RTMRetryCount > 0) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2739
    // Retry on lock abort if abort status is not permanent.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2740
    rtm_retry_lock_on_abort(retry_on_abort_count_Reg, abort_status_Reg, L_rtm_retry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2741
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2742
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2743
  // Appears unlocked - try to swing _owner from null to non-null.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2744
  cmpxchgd(flag, /*current val*/ R0, (intptr_t)0, /*new val*/ R16_thread, owner_addr_Reg,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2745
           MacroAssembler::MemBarRel | MacroAssembler::MemBarAcq,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2746
           MacroAssembler::cmpxchgx_hint_acquire_lock(), noreg, &L_decrement_retry, true);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2747
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2748
  if (RTMRetryCount > 0) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2749
    // success done else retry
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2750
    b(DONE_LABEL);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2751
    bind(L_decrement_retry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2752
    // Spin and retry if lock is busy.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2753
    rtm_retry_lock_on_busy(retry_on_busy_count_Reg, owner_addr_Reg, L_rtm_retry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2754
  } else {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2755
    bind(L_decrement_retry);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2756
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2757
}
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2758
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2759
#endif //  INCLUDE_RTM_OPT
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2760
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2761
// "The box" is the space on the stack where we copy the object mark.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2762
void MacroAssembler::compiler_fast_lock_object(ConditionRegister flag, Register oop, Register box,
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2763
                                               Register temp, Register displaced_header, Register current_header,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2764
                                               bool try_bias,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2765
                                               RTMLockingCounters* rtm_counters,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2766
                                               RTMLockingCounters* stack_rtm_counters,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2767
                                               Metadata* method_data,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2768
                                               bool use_rtm, bool profile_rtm) {
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2769
  assert_different_registers(oop, box, temp, displaced_header, current_header);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2770
  assert(flag != CCR0, "bad condition register");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2771
  Label cont;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2772
  Label object_has_monitor;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2773
  Label cas_failed;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2774
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2775
  // Load markOop from object into displaced_header.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2776
  ld(displaced_header, oopDesc::mark_offset_in_bytes(), oop);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2777
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2778
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2779
  // Always do locking in runtime.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2780
  if (EmitSync & 0x01) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2781
    cmpdi(flag, oop, 0); // Oop can't be 0 here => always false.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2782
    return;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2783
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2784
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2785
  if (try_bias) {
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2786
    biased_locking_enter(flag, oop, displaced_header, temp, current_header, cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2787
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2788
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2789
#if INCLUDE_RTM_OPT
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2790
  if (UseRTMForStackLocks && use_rtm) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2791
    rtm_stack_locking(flag, oop, displaced_header, temp, /*temp*/ current_header,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2792
                      stack_rtm_counters, method_data, profile_rtm,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2793
                      cont, object_has_monitor);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2794
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2795
#endif // INCLUDE_RTM_OPT
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2796
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2797
  // Handle existing monitor.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2798
  if ((EmitSync & 0x02) == 0) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2799
    // The object has an existing monitor iff (mark & monitor_value) != 0.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2800
    andi_(temp, displaced_header, markOopDesc::monitor_value);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2801
    bne(CCR0, object_has_monitor);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2802
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2803
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2804
  // Set displaced_header to be (markOop of object | UNLOCK_VALUE).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2805
  ori(displaced_header, displaced_header, markOopDesc::unlocked_value);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2806
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2807
  // Load Compare Value application register.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2808
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2809
  // Initialize the box. (Must happen before we update the object mark!)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2810
  std(displaced_header, BasicLock::displaced_header_offset_in_bytes(), box);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2811
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2812
  // Must fence, otherwise, preceding store(s) may float below cmpxchg.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2813
  // Compare object markOop with mark and if equal exchange scratch1 with object markOop.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2814
  cmpxchgd(/*flag=*/flag,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2815
           /*current_value=*/current_header,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2816
           /*compare_value=*/displaced_header,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2817
           /*exchange_value=*/box,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2818
           /*where=*/oop,
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2819
           MacroAssembler::MemBarRel | MacroAssembler::MemBarAcq,
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2820
           MacroAssembler::cmpxchgx_hint_acquire_lock(),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2821
           noreg,
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2822
           &cas_failed,
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2823
           /*check without membar and ldarx first*/true);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2824
  assert(oopDesc::mark_offset_in_bytes() == 0, "offset of _mark is not 0");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2825
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2826
  // If the compare-and-exchange succeeded, then we found an unlocked
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2827
  // object and we have now locked it.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2828
  b(cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2829
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2830
  bind(cas_failed);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2831
  // We did not see an unlocked object so try the fast recursive case.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2832
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2833
  // Check if the owner is self by comparing the value in the markOop of object
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2834
  // (current_header) with the stack pointer.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2835
  sub(current_header, current_header, R1_SP);
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  2836
  load_const_optimized(temp, ~(os::vm_page_size()-1) | markOopDesc::lock_mask_in_place);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2837
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2838
  and_(R0/*==0?*/, current_header, temp);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2839
  // If condition is true we are cont and hence we can store 0 as the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2840
  // displaced header in the box, which indicates that it is a recursive lock.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2841
  mcrf(flag,CCR0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2842
  std(R0/*==0, perhaps*/, BasicLock::displaced_header_offset_in_bytes(), box);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2843
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2844
  // Handle existing monitor.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2845
  if ((EmitSync & 0x02) == 0) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2846
    b(cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2847
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2848
    bind(object_has_monitor);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2849
    // The object's monitor m is unlocked iff m->owner == NULL,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2850
    // otherwise m->owner may contain a thread or a stack address.
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2851
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2852
#if INCLUDE_RTM_OPT
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2853
    // Use the same RTM locking code in 32- and 64-bit VM.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2854
    if (use_rtm) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2855
      rtm_inflated_locking(flag, oop, displaced_header, box, temp, /*temp*/ current_header,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2856
                           rtm_counters, method_data, profile_rtm, cont);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2857
    } else {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2858
#endif // INCLUDE_RTM_OPT
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2859
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2860
    // Try to CAS m->owner from NULL to current thread.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2861
    addi(temp, displaced_header, ObjectMonitor::owner_offset_in_bytes()-markOopDesc::monitor_value);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2862
    cmpxchgd(/*flag=*/flag,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2863
             /*current_value=*/current_header,
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2864
             /*compare_value=*/(intptr_t)0,
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2865
             /*exchange_value=*/R16_thread,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2866
             /*where=*/temp,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2867
             MacroAssembler::MemBarRel | MacroAssembler::MemBarAcq,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2868
             MacroAssembler::cmpxchgx_hint_acquire_lock());
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2869
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2870
    // Store a non-null value into the box.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2871
    std(box, BasicLock::displaced_header_offset_in_bytes(), box);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2872
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2873
#   ifdef ASSERT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2874
    bne(flag, cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2875
    // We have acquired the monitor, check some invariants.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2876
    addi(/*monitor=*/temp, temp, -ObjectMonitor::owner_offset_in_bytes());
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2877
    // Invariant 1: _recursions should be 0.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2878
    //assert(ObjectMonitor::recursions_size_in_bytes() == 8, "unexpected size");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2879
    asm_assert_mem8_is_zero(ObjectMonitor::recursions_offset_in_bytes(), temp,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2880
                            "monitor->_recursions should be 0", -1);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2881
    // Invariant 2: OwnerIsThread shouldn't be 0.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2882
    //assert(ObjectMonitor::OwnerIsThread_size_in_bytes() == 4, "unexpected size");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2883
    //asm_assert_mem4_isnot_zero(ObjectMonitor::OwnerIsThread_offset_in_bytes(), temp,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2884
    //                           "monitor->OwnerIsThread shouldn't be 0", -1);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2885
#   endif
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2886
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2887
#if INCLUDE_RTM_OPT
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2888
    } // use_rtm()
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2889
#endif
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2890
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2891
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2892
  bind(cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2893
  // flag == EQ indicates success
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2894
  // flag == NE indicates failure
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2895
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2896
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2897
void MacroAssembler::compiler_fast_unlock_object(ConditionRegister flag, Register oop, Register box,
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2898
                                                 Register temp, Register displaced_header, Register current_header,
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2899
                                                 bool try_bias, bool use_rtm) {
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2900
  assert_different_registers(oop, box, temp, displaced_header, current_header);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2901
  assert(flag != CCR0, "bad condition register");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2902
  Label cont;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2903
  Label object_has_monitor;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2904
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2905
  // Always do locking in runtime.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2906
  if (EmitSync & 0x01) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2907
    cmpdi(flag, oop, 0); // Oop can't be 0 here => always false.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2908
    return;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2909
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2910
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2911
  if (try_bias) {
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2912
    biased_locking_exit(flag, oop, current_header, cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2913
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2914
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2915
#if INCLUDE_RTM_OPT
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2916
  if (UseRTMForStackLocks && use_rtm) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2917
    assert(!UseBiasedLocking, "Biased locking is not supported with RTM locking");
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2918
    Label L_regular_unlock;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2919
    ld(current_header, oopDesc::mark_offset_in_bytes(), oop);         // fetch markword
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2920
    andi(R0, current_header, markOopDesc::biased_lock_mask_in_place); // look at 3 lock bits
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2921
    cmpwi(flag, R0, markOopDesc::unlocked_value);                     // bits = 001 unlocked
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2922
    bne(flag, L_regular_unlock);                                      // else RegularLock
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2923
    tend_();                                                          // otherwise end...
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2924
    b(cont);                                                          // ... and we're done
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2925
    bind(L_regular_unlock);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2926
  }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2927
#endif
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2928
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2929
  // Find the lock address and load the displaced header from the stack.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2930
  ld(displaced_header, BasicLock::displaced_header_offset_in_bytes(), box);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2931
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2932
  // If the displaced header is 0, we have a recursive unlock.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2933
  cmpdi(flag, displaced_header, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2934
  beq(flag, cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2935
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2936
  // Handle existing monitor.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2937
  if ((EmitSync & 0x02) == 0) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2938
    // The object has an existing monitor iff (mark & monitor_value) != 0.
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2939
    RTM_OPT_ONLY( if (!(UseRTMForStackLocks && use_rtm)) ) // skip load if already done
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2940
    ld(current_header, oopDesc::mark_offset_in_bytes(), oop);
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2941
    andi_(R0, current_header, markOopDesc::monitor_value);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2942
    bne(CCR0, object_has_monitor);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2943
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2944
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2945
  // Check if it is still a light weight lock, this is true if we see
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2946
  // the stack address of the basicLock in the markOop of the object.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2947
  // Cmpxchg sets flag to cmpd(current_header, box).
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2948
  cmpxchgd(/*flag=*/flag,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2949
           /*current_value=*/current_header,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2950
           /*compare_value=*/box,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2951
           /*exchange_value=*/displaced_header,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2952
           /*where=*/oop,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2953
           MacroAssembler::MemBarRel,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2954
           MacroAssembler::cmpxchgx_hint_release_lock(),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2955
           noreg,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2956
           &cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2957
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2958
  assert(oopDesc::mark_offset_in_bytes() == 0, "offset of _mark is not 0");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2959
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2960
  // Handle existing monitor.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2961
  if ((EmitSync & 0x02) == 0) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2962
    b(cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2963
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2964
    bind(object_has_monitor);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2965
    addi(current_header, current_header, -markOopDesc::monitor_value); // monitor
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2966
    ld(temp,             ObjectMonitor::owner_offset_in_bytes(), current_header);
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2967
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2968
    // It's inflated.
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2969
#if INCLUDE_RTM_OPT
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2970
    if (use_rtm) {
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2971
      Label L_regular_inflated_unlock;
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2972
      // Clean monitor_value bit to get valid pointer
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2973
      cmpdi(flag, temp, 0);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2974
      bne(flag, L_regular_inflated_unlock);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2975
      tend_();
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2976
      b(cont);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2977
      bind(L_regular_inflated_unlock);
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2978
    }
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2979
#endif
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  2980
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2981
    ld(displaced_header, ObjectMonitor::recursions_offset_in_bytes(), current_header);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2982
    xorr(temp, R16_thread, temp);      // Will be 0 if we are the owner.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2983
    orr(temp, temp, displaced_header); // Will be 0 if there are 0 recursions.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2984
    cmpdi(flag, temp, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2985
    bne(flag, cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2986
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2987
    ld(temp,             ObjectMonitor::EntryList_offset_in_bytes(), current_header);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2988
    ld(displaced_header, ObjectMonitor::cxq_offset_in_bytes(), current_header);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2989
    orr(temp, temp, displaced_header); // Will be 0 if both are 0.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2990
    cmpdi(flag, temp, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2991
    bne(flag, cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2992
    release();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2993
    std(temp, ObjectMonitor::owner_offset_in_bytes(), current_header);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2994
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2995
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2996
  bind(cont);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2997
  // flag == EQ indicates success
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2998
  // flag == NE indicates failure
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  2999
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3000
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3001
// Write serialization page so VM thread can do a pseudo remote membar.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3002
// We use the current thread pointer to calculate a thread specific
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3003
// offset to write to within the page. This minimizes bus traffic
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3004
// due to cache line collision.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3005
void MacroAssembler::serialize_memory(Register thread, Register tmp1, Register tmp2) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3006
  srdi(tmp2, thread, os::get_serialize_page_shift_count());
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3007
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3008
  int mask = os::vm_page_size() - sizeof(int);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3009
  if (Assembler::is_simm(mask, 16)) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3010
    andi(tmp2, tmp2, mask);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3011
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3012
    lis(tmp1, (int)((signed short) (mask >> 16)));
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3013
    ori(tmp1, tmp1, mask & 0x0000ffff);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3014
    andr(tmp2, tmp2, tmp1);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3015
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3016
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3017
  load_const(tmp1, (long) os::get_memory_serialize_page());
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3018
  release();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3019
  stwx(R0, tmp1, tmp2);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3020
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3021
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3022
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3023
// GC barrier helper macros
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3024
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3025
// Write the card table byte if needed.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3026
void MacroAssembler::card_write_barrier_post(Register Rstore_addr, Register Rnew_val, Register Rtmp) {
29325
0e86e64c66e5 8069016: Add BarrierSet downcast support
kbarrett
parents: 28187
diff changeset
  3027
  CardTableModRefBS* bs =
0e86e64c66e5 8069016: Add BarrierSet downcast support
kbarrett
parents: 28187
diff changeset
  3028
    barrier_set_cast<CardTableModRefBS>(Universe::heap()->barrier_set());
32596
8feecdee3156 8072817: CardTableExtension kind() should be BarrierSet::CardTableExtension
kbarrett
parents: 31861
diff changeset
  3029
  assert(bs->kind() == BarrierSet::CardTableForRS ||
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3030
         bs->kind() == BarrierSet::CardTableExtension, "wrong barrier");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3031
#ifdef ASSERT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3032
  cmpdi(CCR0, Rnew_val, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3033
  asm_assert_ne("null oop not allowed", 0x321);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3034
#endif
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3035
  card_table_write(bs->byte_map_base, Rtmp, Rstore_addr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3036
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3037
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3038
// Write the card table byte.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3039
void MacroAssembler::card_table_write(jbyte* byte_map_base, Register Rtmp, Register Robj) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3040
  assert_different_registers(Robj, Rtmp, R0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3041
  load_const_optimized(Rtmp, (address)byte_map_base, R0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3042
  srdi(Robj, Robj, CardTableModRefBS::card_shift);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3043
  li(R0, 0); // dirty
22867
309bcf262a19 8031319: PPC64: Some fixes in ppc and aix coding.
goetz
parents: 22861
diff changeset
  3044
  if (UseConcMarkSweepGC) membar(Assembler::StoreStore);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3045
  stbx(R0, Rtmp, Robj);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3046
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3047
44406
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3048
// Kills R31 if value is a volatile register.
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3049
void MacroAssembler::resolve_jobject(Register value, Register tmp1, Register tmp2, bool needs_frame) {
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3050
  Label done;
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3051
  cmpdi(CCR0, value, 0);
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3052
  beq(CCR0, done);         // Use NULL as-is.
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3053
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3054
  clrrdi(tmp1, value, JNIHandles::weak_tag_size);
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3055
#if INCLUDE_ALL_GCS
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3056
  if (UseG1GC) { andi_(tmp2, value, JNIHandles::weak_tag_mask); }
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3057
#endif
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3058
  ld(value, 0, tmp1);      // Resolve (untagged) jobject.
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3059
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3060
#if INCLUDE_ALL_GCS
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3061
  if (UseG1GC) {
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3062
    Label not_weak;
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3063
    beq(CCR0, not_weak);   // Test for jweak tag.
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3064
    verify_oop(value);
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3065
    g1_write_barrier_pre(noreg, // obj
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3066
                         noreg, // offset
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3067
                         value, // pre_val
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3068
                         tmp1, tmp2, needs_frame);
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3069
    bind(not_weak);
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3070
  }
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3071
#endif // INCLUDE_ALL_GCS
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3072
  verify_oop(value);
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3073
  bind(done);
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3074
}
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3075
23492
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  3076
#if INCLUDE_ALL_GCS
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3077
// General G1 pre-barrier generator.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3078
// Goal: record the previous value if it is not null.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3079
void MacroAssembler::g1_write_barrier_pre(Register Robj, RegisterOrConstant offset, Register Rpre_val,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3080
                                          Register Rtmp1, Register Rtmp2, bool needs_frame) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3081
  Label runtime, filtered;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3082
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3083
  // Is marking active?
34148
6efbc7ffd767 8143014: Access PtrQueue member offsets through derived classes
kbarrett
parents: 33198
diff changeset
  3084
  if (in_bytes(SATBMarkQueue::byte_width_of_active()) == 4) {
6efbc7ffd767 8143014: Access PtrQueue member offsets through derived classes
kbarrett
parents: 33198
diff changeset
  3085
    lwz(Rtmp1, in_bytes(JavaThread::satb_mark_queue_offset() + SATBMarkQueue::byte_offset_of_active()), R16_thread);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3086
  } else {
34148
6efbc7ffd767 8143014: Access PtrQueue member offsets through derived classes
kbarrett
parents: 33198
diff changeset
  3087
    guarantee(in_bytes(SATBMarkQueue::byte_width_of_active()) == 1, "Assumption");
6efbc7ffd767 8143014: Access PtrQueue member offsets through derived classes
kbarrett
parents: 33198
diff changeset
  3088
    lbz(Rtmp1, in_bytes(JavaThread::satb_mark_queue_offset() + SATBMarkQueue::byte_offset_of_active()), R16_thread);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3089
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3090
  cmpdi(CCR0, Rtmp1, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3091
  beq(CCR0, filtered);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3092
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3093
  // Do we need to load the previous value?
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3094
  if (Robj != noreg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3095
    // Load the previous value...
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3096
    if (UseCompressedOops) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3097
      lwz(Rpre_val, offset, Robj);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3098
    } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3099
      ld(Rpre_val, offset, Robj);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3100
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3101
    // Previous value has been loaded into Rpre_val.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3102
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3103
  assert(Rpre_val != noreg, "must have a real register");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3104
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3105
  // Is the previous value null?
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3106
  cmpdi(CCR0, Rpre_val, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3107
  beq(CCR0, filtered);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3108
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3109
  if (Robj != noreg && UseCompressedOops) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3110
    decode_heap_oop_not_null(Rpre_val);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3111
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3112
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3113
  // OK, it's not filtered, so we'll need to call enqueue. In the normal
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3114
  // case, pre_val will be a scratch G-reg, but there are some cases in
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3115
  // which it's an O-reg. In the first case, do a normal call. In the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3116
  // latter, do a save here and call the frameless version.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3117
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3118
  // Can we store original value in the thread's buffer?
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3119
  // Is index == 0?
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3120
  // (The index field is typed as size_t.)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3121
  const Register Rbuffer = Rtmp1, Rindex = Rtmp2;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3122
34148
6efbc7ffd767 8143014: Access PtrQueue member offsets through derived classes
kbarrett
parents: 33198
diff changeset
  3123
  ld(Rindex, in_bytes(JavaThread::satb_mark_queue_offset() + SATBMarkQueue::byte_offset_of_index()), R16_thread);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3124
  cmpdi(CCR0, Rindex, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3125
  beq(CCR0, runtime); // If index == 0, goto runtime.
34148
6efbc7ffd767 8143014: Access PtrQueue member offsets through derived classes
kbarrett
parents: 33198
diff changeset
  3126
  ld(Rbuffer, in_bytes(JavaThread::satb_mark_queue_offset() + SATBMarkQueue::byte_offset_of_buf()), R16_thread);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3127
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3128
  addi(Rindex, Rindex, -wordSize); // Decrement index.
34148
6efbc7ffd767 8143014: Access PtrQueue member offsets through derived classes
kbarrett
parents: 33198
diff changeset
  3129
  std(Rindex, in_bytes(JavaThread::satb_mark_queue_offset() + SATBMarkQueue::byte_offset_of_index()), R16_thread);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3130
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3131
  // Record the previous value.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3132
  stdx(Rpre_val, Rbuffer, Rindex);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3133
  b(filtered);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3134
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3135
  bind(runtime);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3136
44406
a46a6c4d1dd9 8176100: [REDO][REDO] G1 Needs pre barrier on dereference of weak JNI handles
mgerdin
parents: 44093
diff changeset
  3137
  // May need to preserve LR. Also needed if current frame is not compatible with C calling convention.
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3138
  if (needs_frame) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3139
    save_LR_CR(Rtmp1);
23211
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  3140
    push_frame_reg_args(0, Rtmp2);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3141
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3142
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3143
  if (Rpre_val->is_volatile() && Robj == noreg) mr(R31, Rpre_val); // Save pre_val across C call if it was preloaded.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3144
  call_VM_leaf(CAST_FROM_FN_PTR(address, SharedRuntime::g1_wb_pre), Rpre_val, R16_thread);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3145
  if (Rpre_val->is_volatile() && Robj == noreg) mr(Rpre_val, R31); // restore
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3146
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3147
  if (needs_frame) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3148
    pop_frame();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3149
    restore_LR_CR(Rtmp1);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3150
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3151
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3152
  bind(filtered);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3153
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3154
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3155
// General G1 post-barrier generator
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3156
// Store cross-region card.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3157
void MacroAssembler::g1_write_barrier_post(Register Rstore_addr, Register Rnew_val, Register Rtmp1, Register Rtmp2, Register Rtmp3, Label *filtered_ext) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3158
  Label runtime, filtered_int;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3159
  Label& filtered = (filtered_ext != NULL) ? *filtered_ext : filtered_int;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3160
  assert_different_registers(Rstore_addr, Rnew_val, Rtmp1, Rtmp2);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3161
29325
0e86e64c66e5 8069016: Add BarrierSet downcast support
kbarrett
parents: 28187
diff changeset
  3162
  G1SATBCardTableLoggingModRefBS* bs =
0e86e64c66e5 8069016: Add BarrierSet downcast support
kbarrett
parents: 28187
diff changeset
  3163
    barrier_set_cast<G1SATBCardTableLoggingModRefBS>(Universe::heap()->barrier_set());
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3164
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3165
  // Does store cross heap regions?
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3166
  if (G1RSBarrierRegionFilter) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3167
    xorr(Rtmp1, Rstore_addr, Rnew_val);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3168
    srdi_(Rtmp1, Rtmp1, HeapRegion::LogOfHRGrainBytes);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3169
    beq(CCR0, filtered);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3170
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3171
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3172
  // Crosses regions, storing NULL?
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3173
#ifdef ASSERT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3174
  cmpdi(CCR0, Rnew_val, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3175
  asm_assert_ne("null oop not allowed (G1)", 0x322); // Checked by caller on PPC64, so following branch is obsolete:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3176
  //beq(CCR0, filtered);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3177
#endif
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3178
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3179
  // Storing region crossing non-NULL, is card already dirty?
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3180
  assert(sizeof(*bs->byte_map_base) == sizeof(jbyte), "adjust this code");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3181
  const Register Rcard_addr = Rtmp1;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3182
  Register Rbase = Rtmp2;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3183
  load_const_optimized(Rbase, (address)bs->byte_map_base, /*temp*/ Rtmp3);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3184
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3185
  srdi(Rcard_addr, Rstore_addr, CardTableModRefBS::card_shift);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3186
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3187
  // Get the address of the card.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3188
  lbzx(/*card value*/ Rtmp3, Rbase, Rcard_addr);
23492
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  3189
  cmpwi(CCR0, Rtmp3, (int)G1SATBCardTableModRefBS::g1_young_card_val());
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  3190
  beq(CCR0, filtered);
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  3191
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  3192
  membar(Assembler::StoreLoad);
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  3193
  lbzx(/*card value*/ Rtmp3, Rbase, Rcard_addr);  // Reload after membar.
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  3194
  cmpwi(CCR0, Rtmp3 /* card value */, CardTableModRefBS::dirty_card_val());
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3195
  beq(CCR0, filtered);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3196
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3197
  // Storing a region crossing, non-NULL oop, card is clean.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3198
  // Dirty card and log.
23492
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  3199
  li(Rtmp3, CardTableModRefBS::dirty_card_val());
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3200
  //release(); // G1: oops are allowed to get visible after dirty marking.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3201
  stbx(Rtmp3, Rbase, Rcard_addr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3202
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3203
  add(Rcard_addr, Rbase, Rcard_addr); // This is the address which needs to get enqueued.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3204
  Rbase = noreg; // end of lifetime
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3205
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3206
  const Register Rqueue_index = Rtmp2,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3207
                 Rqueue_buf   = Rtmp3;
34148
6efbc7ffd767 8143014: Access PtrQueue member offsets through derived classes
kbarrett
parents: 33198
diff changeset
  3208
  ld(Rqueue_index, in_bytes(JavaThread::dirty_card_queue_offset() + DirtyCardQueue::byte_offset_of_index()), R16_thread);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3209
  cmpdi(CCR0, Rqueue_index, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3210
  beq(CCR0, runtime); // index == 0 then jump to runtime
34148
6efbc7ffd767 8143014: Access PtrQueue member offsets through derived classes
kbarrett
parents: 33198
diff changeset
  3211
  ld(Rqueue_buf, in_bytes(JavaThread::dirty_card_queue_offset() + DirtyCardQueue::byte_offset_of_buf()), R16_thread);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3212
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3213
  addi(Rqueue_index, Rqueue_index, -wordSize); // decrement index
34148
6efbc7ffd767 8143014: Access PtrQueue member offsets through derived classes
kbarrett
parents: 33198
diff changeset
  3214
  std(Rqueue_index, in_bytes(JavaThread::dirty_card_queue_offset() + DirtyCardQueue::byte_offset_of_index()), R16_thread);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3215
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3216
  stdx(Rcard_addr, Rqueue_buf, Rqueue_index); // store card
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3217
  b(filtered);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3218
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3219
  bind(runtime);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3220
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3221
  // Save the live input values.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3222
  call_VM_leaf(CAST_FROM_FN_PTR(address, SharedRuntime::g1_wb_post), Rcard_addr, R16_thread);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3223
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3224
  bind(filtered_int);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3225
}
23492
af5352f40e65 8037915: PPC64/AIX: Several smaller fixes
goetz
parents: 23221
diff changeset
  3226
#endif // INCLUDE_ALL_GCS
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3227
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3228
// Values for last_Java_pc, and last_Java_sp must comply to the rules
27012
f8fdfab4757b 8059592: Recent bugfixes in ppc64 port.
goetz
parents: 25715
diff changeset
  3229
// in frame_ppc.hpp.
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3230
void MacroAssembler::set_last_Java_frame(Register last_Java_sp, Register last_Java_pc) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3231
  // Always set last_Java_pc and flags first because once last_Java_sp
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3232
  // is visible has_last_Java_frame is true and users will look at the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3233
  // rest of the fields. (Note: flags should always be zero before we
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3234
  // get here so doesn't need to be set.)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3235
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3236
  // Verify that last_Java_pc was zeroed on return to Java
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3237
  asm_assert_mem8_is_zero(in_bytes(JavaThread::last_Java_pc_offset()), R16_thread,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3238
                          "last_Java_pc not zeroed before leaving Java", 0x200);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3239
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3240
  // When returning from calling out from Java mode the frame anchor's
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3241
  // last_Java_pc will always be set to NULL. It is set here so that
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3242
  // if we are doing a call to native (not VM) that we capture the
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3243
  // known pc and don't have to rely on the native call having a
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3244
  // standard frame linkage where we can find the pc.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3245
  if (last_Java_pc != noreg)
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3246
    std(last_Java_pc, in_bytes(JavaThread::last_Java_pc_offset()), R16_thread);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3247
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
  3248
  // Set last_Java_sp last.
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3249
  std(last_Java_sp, in_bytes(JavaThread::last_Java_sp_offset()), R16_thread);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3250
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3251
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3252
void MacroAssembler::reset_last_Java_frame(void) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3253
  asm_assert_mem8_isnot_zero(in_bytes(JavaThread::last_Java_sp_offset()),
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3254
                             R16_thread, "SP was not set, still zero", 0x202);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3255
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3256
  BLOCK_COMMENT("reset_last_Java_frame {");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3257
  li(R0, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3258
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3259
  // _last_Java_sp = 0
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3260
  std(R0, in_bytes(JavaThread::last_Java_sp_offset()), R16_thread);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3261
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3262
  // _last_Java_pc = 0
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3263
  std(R0, in_bytes(JavaThread::last_Java_pc_offset()), R16_thread);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3264
  BLOCK_COMMENT("} reset_last_Java_frame");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3265
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3266
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3267
// Set the last Java frame from a frame pointed to by sp, using the current
// code emission position as the frame's pc.
//
//   sp   - stack pointer to record as last_Java_sp
//   tmp1 - scratch register; receives the pc constant and must differ from sp
void MacroAssembler::set_top_ijava_frame_at_SP_as_last_Java_frame(Register sp, Register tmp1) {
  assert_different_registers(sp, tmp1);

  // sp is expected to point to a TOP_IJAVA_FRAME; the frame's PC is
  // retrieved via TOP_IJAVA_FRAME_ABI.
  // FIXME: assert that we really have a TOP_IJAVA_FRAME here!
  // The pc is sampled before the load-constant sequence is emitted.
  const address frame_pc = pc();
  load_const_optimized(tmp1, frame_pc);

  set_last_Java_frame(/*sp=*/sp, /*pc=*/tmp1);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3278
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3279
// Fetch the oop result a VM call left in the thread and clear the slot.
//
// Reads:
//   R16_thread
//   the vm_result field of R16_thread
//
// Writes:
//   oop_result  - receives the value of the vm_result field
//   the vm_result field of R16_thread (set to 0)
//   R0          - overwritten with 0
void MacroAssembler::get_vm_result(Register oop_result) {
  verify_thread();

  // Load the result, then zero the slot.
  ld(oop_result, in_bytes(JavaThread::vm_result_offset()), R16_thread);
  li(R0, 0);
  std(R0, in_bytes(JavaThread::vm_result_offset()), R16_thread);

  verify_oop(oop_result);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3296
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3297
// Fetch the metadata result a VM call left in the thread and clear the slot.
//
// Reads:
//   R16_thread
//   the vm_result_2 field of R16_thread
//
// Writes:
//   metadata_result  - receives the value of the vm_result_2 field
//   the vm_result_2 field of R16_thread (set to 0)
//   R0               - overwritten with 0
void MacroAssembler::get_vm_result_2(Register metadata_result) {
  // Load the result, then zero the slot.
  ld(metadata_result, in_bytes(JavaThread::vm_result_2_offset()), R16_thread);
  li(R0, 0);
  std(R0, in_bytes(JavaThread::vm_result_2_offset()), R16_thread);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3310
30303
c703c89fddbf 8077838: Recent developments for ppc.
goetz
parents: 29325
diff changeset
  3311
// Emit code that compresses a klass pointer: subtract the narrow klass base
// (if non-zero), then shift right by the narrow klass shift (if non-zero).
//
//   dst - destination of any emitted instruction
//   src - register holding the klass; if noreg, the klass is taken from dst
//
// Returns the register that holds the encoded klass. This is dst whenever an
// instruction was emitted; otherwise it is the input register, unchanged.
// R0 is passed as temp to the base subtraction.
Register MacroAssembler::encode_klass_not_null(Register dst, Register src) {
  // Klass is in dst if no src was provided.
  Register klass_reg = (src == noreg) ? dst : src;

  if (Universe::narrow_klass_base() != 0) {
    // dst doubles as the intermediate result register.
    sub_const_optimized(dst, klass_reg, Universe::narrow_klass_base(), R0);
    klass_reg = dst;
  }

  if (Universe::narrow_klass_shift() != 0) {
    srdi(dst, klass_reg, Universe::narrow_klass_shift());
    klass_reg = dst;
  }

  return klass_reg;
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3324
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3325
// Emit code that stores klass into the klass field of dst_oop.
//
//   dst_oop - object whose klass field is written
//   klass   - uncompressed klass pointer
//   ck      - destination register handed to encode_klass_not_null when
//             compressed class pointers are in use
void MacroAssembler::store_klass(Register dst_oop, Register klass, Register ck) {
  if (!UseCompressedClassPointers) {
    // Full-width klass pointer: 64-bit store.
    std(klass, oopDesc::klass_offset_in_bytes(), dst_oop);
    return;
  }

  // Compressed klass pointer: encode, then 32-bit store of whichever
  // register the encoder reports as holding the result.
  Register narrow_klass = encode_klass_not_null(ck, klass);
  stw(narrow_klass, oopDesc::klass_offset_in_bytes(), dst_oop);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3333
23221
b70675ece1ce 8036976: PPC64: implement the template interpreter
goetz
parents: 23211
diff changeset
  3334
// Emit code that writes the klass gap of dst_oop. Nothing is emitted unless
// compressed class pointers are in use.
//
//   dst_oop - object whose klass gap is written
//   val     - 32-bit value to store; if noreg, R0 is loaded with 0 and stored
void MacroAssembler::store_klass_gap(Register dst_oop, Register val) {
  if (!UseCompressedClassPointers) {
    return;  // nothing to emit in this configuration
  }

  if (val == noreg) {
    // No value supplied: store zero via R0.
    li(R0, 0);
    val = R0;
  }
  stw(val, oopDesc::klass_gap_offset_in_bytes(), dst_oop); // klass gap if compressed
}
b70675ece1ce 8036976: PPC64: implement the template interpreter
goetz
parents: 23211
diff changeset
  3343
22843
b245fac3b6a4 8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents: 22840
diff changeset
  3344
int MacroAssembler::instr_size_for_decode_klass_not_null() {
b245fac3b6a4 8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents: 22840
diff changeset
  3345
  if (!UseCompressedClassPointers) return 0;
b245fac3b6a4 8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents: 22840
diff changeset
  3346
  int num_instrs = 1;  // shift or move
b245fac3b6a4 8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents: 22840
diff changeset
  3347
  if (Universe::narrow_klass_base() != 0) num_instrs = 7;  // shift + load const + add
b245fac3b6a4 8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents: 22840
diff changeset
  3348
  return num_instrs * BytesPerInstWord;
b245fac3b6a4 8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents: 22840
diff changeset
  3349
}
b245fac3b6a4 8027968: Adapt PPC to 8024927: Nashorn performance regression with CompressedOops
goetz
parents: 22840
diff changeset
  3350
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3351
// Emit code that decompresses a narrow klass: shift left by the narrow klass
// shift, then add the narrow klass base (if non-zero).
//
//   dst - receives the decoded klass; must not be R0, which is used as temp
//   src - register holding the narrow klass; if noreg, dst is decoded in place
void MacroAssembler::decode_klass_not_null(Register dst, Register src) {
  assert(dst != R0, "Dst reg may not be R0, as R0 is used here.");
  if (src == noreg) src = dst;

  const bool has_shift = Universe::narrow_klass_shift() != 0;
  const bool has_base  = Universe::narrow_klass_base() != 0;

  // Register that feeds the base addition (or already holds the result).
  Register base_operand = src;

  // The shift is emitted when there is a real shift, or when neither shift
  // nor base applies but the value still has to get from src to dst; in
  // that case the shift amount is 0 and it acts as a move.
  if (has_shift || (!has_base && src != dst)) {
    sldi(dst, src, Universe::narrow_klass_shift());
    base_operand = dst;
  }

  if (has_base) {
    add_const_optimized(dst, base_operand, Universe::narrow_klass_base(), R0);
  }
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3364
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3365
// Emit code that loads the klass field of the object addressed by src into dst.
// With UseCompressedClassPointers the field is read with a word load and then
// decoded in place via decode_klass_not_null; otherwise it is read with a
// doubleword load and used as is. src is not checked for null.
void MacroAssembler::load_klass(Register dst, Register src) {
  const int klass_offset = oopDesc::klass_offset_in_bytes();

  if (!UseCompressedClassPointers) {
    // Uncompressed: the field already holds the full pointer.
    ld(dst, klass_offset, src);
    return;
  }

  lwz(dst, klass_offset, src);
  // Attention: no null check here!
  decode_klass_not_null(dst, dst);
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3374
46961
c9094b1e5f87 8186088: ConstantPoolCache::_resolved_references is not a JNIHandle
coleenp
parents: 46789
diff changeset
  3375
// ((OopHandle)result).resolve();
c9094b1e5f87 8186088: ConstantPoolCache::_resolved_references is not a JNIHandle
coleenp
parents: 46789
diff changeset
  3376
// Emit code that replaces the address held in 'result' by the doubleword
// stored at that address. The register is both input and output.
void MacroAssembler::resolve_oop_handle(Register result) {
  const Register handle = result;  // Same register; named for its role on entry.
  // OopHandle::resolve is an indirection.
  ld(result, 0, handle);
}
c9094b1e5f87 8186088: ConstantPoolCache::_resolved_references is not a JNIHandle
coleenp
parents: 46789
diff changeset
  3380
42068
18c8a4d5998e 8168083: PPC64: Cleanup template interpreter after 8154580 and 8154867
mdoerr
parents: 41334
diff changeset
  3381
// Emit code that loads the java mirror reachable from a ConstMethod into 'mirror'.
// Three dependent loads walk ConstMethod::constants -> ConstantPool::pool_holder
// -> Klass::java_mirror, and the result is then passed through
// resolve_oop_handle. 'mirror' is the scratch register for every intermediate
// value; const_method is only read.
void MacroAssembler::load_mirror_from_const_method(Register mirror, Register const_method) {
  const int constants_off   = in_bytes(ConstMethod::constants_offset());
  const int pool_holder_off = ConstantPool::pool_holder_offset_in_bytes();
  const int java_mirror_off = in_bytes(Klass::java_mirror_offset());

  ld(mirror, constants_off, const_method);  // constants field of the ConstMethod
  ld(mirror, pool_holder_off, mirror);      // pool holder of that constant pool
  ld(mirror, java_mirror_off, mirror);      // java_mirror field of the holder
  resolve_oop_handle(mirror);               // one more indirection to the mirror itself
}
8475fdc6dcc3 8154580: Save mirror in interpreter frame to enable cleanups of CLDClosure
coleenp
parents: 36303
diff changeset
  3387
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
  3388
// Clear Array
42661
2343dd675325 8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents: 42068
diff changeset
  3389
// For very short arrays. tmp == R0 is allowed.
2343dd675325 8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents: 42068
diff changeset
  3390
// Emit a straight-line (loop-free) sequence that stores zero to cnt_dwords
// consecutive doublewords, the first one at base_ptr + offset.
// Nothing at all is emitted when cnt_dwords <= 0. tmp is overwritten with 0;
// base_ptr is left unchanged.
void MacroAssembler::clear_memory_unrolled(Register base_ptr, int cnt_dwords, Register tmp, int offset) {
  if (cnt_dwords <= 0) {
    return;
  }

  li(tmp, 0);  // The zero that every store below writes.
  for (int i = 0; i != cnt_dwords; i++) {
    const int disp = offset + i * 8;  // Byte displacement of the i-th doubleword.
    std(tmp, disp, base_ptr);
  }
}
2343dd675325 8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents: 42068
diff changeset
  3394
2343dd675325 8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents: 42068
diff changeset
  3395
// Version for constant short array length. Kills base_ptr. tmp == R0 is allowed.
2343dd675325 8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents: 42068
diff changeset
  3396
// Emit code that zeroes cnt_dwords doublewords at base_ptr, where the length is
// a compile-time constant.
//  - Fewer than 8 doublewords: delegated to clear_memory_unrolled (base_ptr is
//    not modified on that path).
//  - Otherwise: a CTR-counted loop that clears two doublewords per iteration and
//    advances base_ptr, plus one trailing store when the length is odd.
// tmp is used for the loop count and then for the zero value.
void MacroAssembler::clear_memory_constlen(Register base_ptr, int cnt_dwords, Register tmp) {
  if (cnt_dwords < 8) {
    clear_memory_unrolled(base_ptr, cnt_dwords, tmp);
    return;
  }

  const long pair_iterations = cnt_dwords >> 1;        // Two doublewords per pass.
  const bool has_odd_dword   = (cnt_dwords & 1) != 0;  // One doubleword left over?
  Label Lpair_loop;

  // tmp first carries the iteration count into CTR, then becomes the zero source.
  li(tmp, pair_iterations);
  mtctr(tmp);
  li(tmp, 0);

  bind(Lpair_loop);
  std(tmp, 0, base_ptr);
  std(tmp, 8, base_ptr);
  addi(base_ptr, base_ptr, 16);
  bdnz(Lpair_loop);

  if (has_odd_dword) {
    // base_ptr now addresses the single doubleword the loop did not cover.
    std(tmp, 0, base_ptr);
  }
}
2343dd675325 8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents: 42068
diff changeset
  3416
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
  3417
// Kills both input registers. tmp == R0 is allowed.
42661
2343dd675325 8170991: PPC64: Bad code for initialization of short arrays
mdoerr
parents: 42068
diff changeset
  3418
// Emit code that zeroes a doubleword-granular memory area, using dcbz (data
// cache block zero) for all complete cache lines.
//
//   base_ptr   - start address; advanced past the cleared area.
//   cnt_dwords - length in doublewords; consumed. When const_cnt >= 0 it is
//                loaded with const_cnt here instead of being read.
//   tmp        - scratch register.
//   const_cnt  - length if known at code generation time, negative otherwise.
//
// Phases of the generated code: doubleword stores up to the next cache line
// boundary, dcbz per cache line, doubleword stores for what is left.
// Short constant lengths are handed to clear_memory_constlen instead.
// CTR, CR0 and (for a non-constant length) CR1 are written.
void MacroAssembler::clear_memory_doubleword(Register base_ptr, Register cnt_dwords, Register tmp, long const_cnt) {
  // Cache line geometry, counted in doublewords (8 bytes each).
  const int cl_size         = VM_Version::L1_data_cache_line_size();
  const int cl_dwords       = cl_size >> 3;
  const int cl_dw_addr_bits = exact_log2(cl_dwords);
  const int dcbz_min        = 1;  // Min count of dcbz executions, needs to be >0.
  // Smallest length that still contains dcbz_min whole lines after the
  // worst-case alignment prefix of cl_dwords - 1 doublewords.
  const int min_cnt         = ((dcbz_min + 1) << cl_dw_addr_bits) - 1;

  Label Lhead_loop, Laligned, Lline_loop, Ltail, Ltail_loop, Lfinished;

  if (const_cnt < 0) {
    // Length is already in cnt_dwords: test at run time whether it is big
    // enough for the dcbz path, otherwise go straight to the plain store loop.
    cmpdi(CCR1, cnt_dwords, min_cnt);
    blt(CCR1, Ltail);
  } else if (const_cnt < min_cnt) {
    // Constant and too short for dcbz: dedicated short-array code, nothing else.
    clear_memory_constlen(base_ptr, const_cnt, tmp);
    return;
  } else {
    // Constant and long enough: materialize the length and use the dcbz path.
    load_const_optimized(cnt_dwords, const_cnt, tmp);
  }

  // tmp = doubleword index of base_ptr within its cache line (record form sets CR0).
  rldicl_(tmp, base_ptr, 64-3, 64-cl_dw_addr_bits);
  beq(CCR0, Laligned);                       // Index 0: already on a line boundary.

  // Head: clear single doublewords until the next line boundary.
  subfic(tmp, tmp, cl_dwords);               // Doublewords up to the boundary (0 < n < cl_dwords).
  mtctr(tmp);
  subf(cnt_dwords, tmp, cnt_dwords);         // Remaining length after the head.
  li(tmp, 0);

  bind(Lhead_loop);
  std(tmp, 0, base_ptr);
  addi(base_ptr, base_ptr, 8);
  bdnz(Lhead_loop);

  // Body: one dcbz per complete cache line.
  bind(Laligned);
  srdi(tmp, cnt_dwords, cl_dw_addr_bits);    // Number of whole lines (> 0).
  andi(cnt_dwords, cnt_dwords, cl_dwords-1); // Doublewords left after the last whole line.
  mtctr(tmp);

  bind(Lline_loop);
  dcbz(base_ptr);
  addi(base_ptr, base_ptr, cl_size);
  bdnz(Lline_loop);

  // Tail: clear the remaining doublewords one by one. Also the entry point
  // for run-time lengths below min_cnt.
  bind(Ltail);
  cmpdi(CCR0, cnt_dwords, 0);
  beq(CCR0, Lfinished);                      // Nothing left.
  li(tmp, 0);
  mtctr(cnt_dwords);

  bind(Ltail_loop);
  std(tmp, 0, base_ptr);
  addi(base_ptr, base_ptr, 8);
  bdnz(Ltail_loop);

  bind(Lfinished);
}
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
  3475
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3476
/////////////////////////////////////////// String intrinsics ////////////////////////////////////////////
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  3477
36303
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3478
#ifdef COMPILER2
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3479
// Intrinsics for CompactStrings
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3480
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3481
// Compress char[] to byte[] by compressing 16 bytes at once.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3482
void MacroAssembler::string_compress_16(Register src, Register dst, Register cnt,
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3483
                                        Register tmp1, Register tmp2, Register tmp3, Register tmp4, Register tmp5,
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3484
                                        Label& Lfailure) {
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3485
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3486
  const Register tmp0 = R0;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3487
  assert_different_registers(src, dst, cnt, tmp0, tmp1, tmp2, tmp3, tmp4, tmp5);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3488
  Label Lloop, Lslow;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3489
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3490
  // Check if cnt >= 8 (= 16 bytes)
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3491
  lis(tmp1, 0xFF);                // tmp1 = 0x00FF00FF00FF00FF
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3492
  srwi_(tmp2, cnt, 3);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3493
  beq(CCR0, Lslow);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3494
  ori(tmp1, tmp1, 0xFF);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3495
  rldimi(tmp1, tmp1, 32, 0);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3496
  mtctr(tmp2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3497
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3498
  // 2x unrolled loop
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3499
  bind(Lloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3500
  ld(tmp2, 0, src);               // _0_1_2_3 (Big Endian)
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3501
  ld(tmp4, 8, src);               // _4_5_6_7
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3502
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3503
  orr(tmp0, tmp2, tmp4);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3504
  rldicl(tmp3, tmp2, 6*8, 64-24); // _____1_2
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3505
  rldimi(tmp2, tmp2, 2*8, 2*8);   // _0_2_3_3
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3506
  rldicl(tmp5, tmp4, 6*8, 64-24); // _____5_6
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3507
  rldimi(tmp4, tmp4, 2*8, 2*8);   // _4_6_7_7
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3508
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3509
  andc_(tmp0, tmp0, tmp1);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3510
  bne(CCR0, Lfailure);            // Not latin1.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3511
  addi(src, src, 16);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3512
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3513
  rlwimi(tmp3, tmp2, 0*8, 24, 31);// _____1_3
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3514
  srdi(tmp2, tmp2, 3*8);          // ____0_2_
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3515
  rlwimi(tmp5, tmp4, 0*8, 24, 31);// _____5_7
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3516
  srdi(tmp4, tmp4, 3*8);          // ____4_6_
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3517
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3518
  orr(tmp2, tmp2, tmp3);          // ____0123
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3519
  orr(tmp4, tmp4, tmp5);          // ____4567
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3520
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3521
  stw(tmp2, 0, dst);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3522
  stw(tmp4, 4, dst);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3523
  addi(dst, dst, 8);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3524
  bdnz(Lloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3525
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3526
  bind(Lslow);                    // Fallback to slow version
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3527
}
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3528
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3529
// Compress char[] to byte[]. cnt must be positive int.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3530
// Emit a char-at-a-time loop that compresses cnt chars at src into cnt bytes at
// dst. cnt is moved to CTR unchecked, so it must be a positive int.
// Branches to Lfailure at the first char above 0xff; src and dst then still
// address that char and its destination byte. tmp, CTR and CR0 are written.
void MacroAssembler::string_compress(Register src, Register dst, Register cnt, Register tmp, Label& Lfailure) {
  const Register current_char = tmp;
  Label Lnext_char;

  mtctr(cnt);

  bind(Lnext_char);
  lhz(current_char, 0, src);        // Next 16-bit char, zero extended.
  cmplwi(CCR0, current_char, 0xff);
  bgt(CCR0, Lfailure);              // Not latin1.
  addi(src, src, 2);
  stb(current_char, 0, dst);        // Keep the low byte only.
  addi(dst, dst, 1);
  bdnz(Lnext_char);
}
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3543
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3544
// Inflate byte[] to char[] by inflating 16 bytes at once.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3545
// Emit the fast path of byte[] -> char[] inflation: each loop iteration reads
// 8 bytes from src and writes 8 chars (16 bytes) to dst.
//
// The loop runs cnt >> 3 times; if that is zero the code falls through at once.
// cnt itself is only read, so any bytes beyond the last full group of 8 are not
// touched by this code. R0 and tmp1..tmp5 are scratch, CTR and CR0 are written.
// The byte diagrams in the comments show register contents for Big Endian.
void MacroAssembler::string_inflate_16(Register src, Register dst, Register cnt,
                                       Register tmp1, Register tmp2, Register tmp3, Register tmp4, Register tmp5) {
  const Register tmp0 = R0;
  assert_different_registers(src, dst, cnt, tmp0, tmp1, tmp2, tmp3, tmp4, tmp5);

  // Role names for the scratch registers.
  const Register spread   = tmp0;  // bytes 0 and 1 moved to char positions
  const Register mask     = tmp1;  // 0x00FF00FF
  const Register bytes_lo = tmp2;  // bytes 0..3 (holds the group count before the loop)
  const Register aux_lo   = tmp3;
  const Register bytes_hi = tmp4;  // bytes 4..7
  const Register aux_hi   = tmp5;
  Label Lgroup_loop, Lno_full_group;

  // Group count = cnt / 8; skip everything if there is no full group.
  srwi_(bytes_lo, cnt, 3);
  beq(CCR0, Lno_full_group);
  lis(mask, 0xFF);                           // mask = 0x00FF00FF
  ori(mask, mask, 0xFF);
  mtctr(bytes_lo);

  // 2x unrolled: two words in, two doublewords out per iteration.
  bind(Lgroup_loop);
  lwz(bytes_lo, 0, src);                     // ____0123 (Big Endian)
  lwz(bytes_hi, 4, src);                     // ____4567
  addi(src, src, 8);

  rldicl(aux_lo, bytes_lo, 7*8, 64-8);       // _______2
  rlwimi(bytes_lo, bytes_lo, 3*8, 16, 23);   // ____0113
  rldicl(aux_hi, bytes_hi, 7*8, 64-8);       // _______6
  rlwimi(bytes_hi, bytes_hi, 3*8, 16, 23);   // ____4557

  andc(spread, bytes_lo, mask);              // ____0_1_
  rlwimi(bytes_lo, aux_lo, 2*8, 0, 23);      // _____2_3
  andc(aux_lo, bytes_hi, mask);              // ____4_5_
  rlwimi(bytes_hi, aux_hi, 2*8, 0, 23);      // _____6_7

  rldimi(bytes_lo, spread, 3*8, 0*8);        // _0_1_2_3
  rldimi(bytes_hi, aux_lo, 3*8, 0*8);        // _4_5_6_7

  std(bytes_lo, 0, dst);
  std(bytes_hi, 8, dst);
  addi(dst, dst, 16);
  bdnz(Lgroup_loop);

  bind(Lno_full_group);                      // Fallback to slow version
}
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3584
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3585
// Inflate byte[] to char[]. cnt must be positive int.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3586
void MacroAssembler::string_inflate(Register src, Register dst, Register cnt, Register tmp) {
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3587
  Label Lloop;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3588
  mtctr(cnt);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3589
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3590
  bind(Lloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3591
  lbz(tmp, 0, src);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3592
  addi(src, src, 1);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3593
  sth(tmp, 0, dst);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3594
  addi(dst, dst, 2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3595
  bdnz(Lloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3596
}
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3597
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3598
// Emits code that compares two strings and leaves a compareTo-style value in
// result: the difference of the first mismatching characters, or, if the
// strings agree over the shorter length, the difference of the lengths.
//
//   str1, str2  - addresses of the first characters; advanced by the emitted code
//   cnt1, cnt2  - lengths; both registers are overwritten. cnt1 is halved for UU
//                 and cnt2 is halved for every encoding except LL (presumably
//                 turning a byte count into a char count - confirm with callers);
//                 otherwise the value is zero-extended from 32 bits.
//   tmp1        - scratch; keeps the length difference for the tie-break
//   result      - receives the comparison result; also used as a scratch
//   ae          - StrIntrinsicNode argument encoding (LL, LU, UL or UU)
//
// R0 is used as an additional scratch register.
//
// The UL case relies on compareTo(a, b) == -compareTo(b, a): str1 and str2 are
// interchanged for UL (the swap itself is not performed in this function) and
// the result is negated at the end. That way str1 is latin1 encoded in every
// case except UU.
void MacroAssembler::string_compare(Register str1, Register str2,
                                    Register cnt1, Register cnt2,
                                    Register tmp1, Register result, int ae) {
  const Register scratch  = R0;
  const Register len_diff = tmp1;

  assert_different_registers(str1, str2, cnt1, cnt2, scratch, tmp1, result);

  const bool is_LL = (ae == StrIntrinsicNode::LL);
  const bool is_UU = (ae == StrIntrinsicNode::UU);

  // Bytes consumed from each string per iteration of the 8-byte loop.
  const int wide_step = 8;

  Label L_finish, L_per_char_setup, L_per_char, L_use_len_diff;

  // Normalize the lengths: shift right by one or zero-extend the 32-bit value.
  if (is_UU) {
    srwi(cnt1, cnt1, 1);
  } else {
    clrldi(cnt1, cnt1, 32);
  }

  if (is_LL) {
    clrldi(cnt2, cnt2, 32);
  } else {
    srwi(cnt2, cnt2, 1);
  }

  // len_diff = cnt1 - cnt2 (kept as the tie-breaker); CCR0 reflects its sign.
  subf_(len_diff, cnt2, cnt1);

  // cnt1 = min(cnt1, cnt2), i.e. if (len_diff > 0) { cnt1 = cnt2; }
  if (!VM_Version::has_isel()) {
    Label L_keep_cnt1;
    blt(CCR0, L_keep_cnt1);
    mr(cnt1, cnt2);
    bind(L_keep_cnt1);
  } else {
    isel(cnt1, CCR0, Assembler::greater, /*invert*/ false, cnt2);
  }

  // From here on result and R0 hold the characters being compared.
  const Register ch1 = result;
  const Register ch2 = scratch;

  // Same-encoding strings only: compare 8 bytes per iteration first.
  if (is_LL || is_UU) {
    const int log2_chars_per_iter = is_LL ? 3 : 2;
    Label L_wide, L_wide_skipped;

    srwi_(scratch, cnt1, log2_chars_per_iter);        // Number of 8-byte iterations.
    beq(CCR0, L_wide_skipped);
    rldicl(cnt2, cnt1, 0, 64 - log2_chars_per_iter);  // Characters left over afterwards.
    li(cnt1, 1 << log2_chars_per_iter);               // On a mismatch, rescan the current iteration's characters.
    mtctr(scratch);

    bind(L_wide);
    ld(ch1, 0, str1);
    ld(ch2, 0, str2);
    cmpd(CCR0, ch1, ch2);
    bne(CCR0, L_per_char_setup);
    addi(str1, str1, wide_step);
    addi(str2, str2, wide_step);
    bdnz(L_wide);
    mr(cnt1, cnt2);                                   // Only the leftover characters remain.
    bind(L_wide_skipped);
  }

  // Character-by-character search for the first difference.
  cmpwi(CCR0, cnt1, 0);
  beq(CCR0, L_use_len_diff);
  bind(L_per_char_setup);
  mtctr(cnt1);

  // Element sizes of the two strings in bytes.
  int step1 = wide_step, step2 = wide_step;
  if (is_LL) {
    step1 = 1; step2 = 1;
  } else if (ae == StrIntrinsicNode::UL || ae == StrIntrinsicNode::LU) {
    // UL is handled like LU (see the note in the function header).
    step1 = 1; step2 = 2;
  } else if (is_UU) {
    step1 = 2; step2 = 2;
  } else {
    ShouldNotReachHere();
  }

  bind(L_per_char);
  if (step1 == 1) {
    lbz(ch1, 0, str1);
  } else {
    lhz(ch1, 0, str1);
  }
  if (step2 == 1) {
    lbz(ch2, 0, str2);
  } else {
    lhz(ch2, 0, str2);
  }
  subf_(result, ch2, ch1);  // result = ch1 - ch2
  bne(CCR0, L_finish);
  addi(str1, str1, step1);
  addi(str2, str2, step2);
  bdnz(L_per_char);

  // No mismatch within the common length: the length difference decides.
  bind(L_use_len_diff);
  mr(result, len_diff);

  // A mismatch arrives here with result = difference of the two characters.
  bind(L_finish);
  if (ae == StrIntrinsicNode::UL) {
    neg(result, result);    // Operands were interchanged, so flip the sign.
  }
}
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3698
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3699
void MacroAssembler::array_equals(bool is_array_equ, Register ary1, Register ary2,
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3700
                                  Register limit, Register tmp1, Register result, bool is_byte) {
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3701
  const Register tmp0 = R0;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3702
  assert_different_registers(ary1, ary2, limit, tmp0, tmp1, result);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3703
  Label Ldone, Lskiploop, Lloop, Lfastloop, Lskipfast;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3704
  bool limit_needs_shift = false;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3705
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3706
  if (is_array_equ) {
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3707
    const int length_offset = arrayOopDesc::length_offset_in_bytes();
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3708
    const int base_offset   = arrayOopDesc::base_offset_in_bytes(is_byte ? T_BYTE : T_CHAR);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3709
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3710
    // Return true if the same array.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3711
    cmpd(CCR0, ary1, ary2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3712
    beq(CCR0, Lskiploop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3713
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3714
    // Return false if one of them is NULL.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3715
    cmpdi(CCR0, ary1, 0);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3716
    cmpdi(CCR1, ary2, 0);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3717
    li(result, 0);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3718
    cror(CCR0, Assembler::equal, CCR1, Assembler::equal);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3719
    beq(CCR0, Ldone);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3720
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3721
    // Load the lengths of arrays.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3722
    lwz(limit, length_offset, ary1);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3723
    lwz(tmp0, length_offset, ary2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3724
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3725
    // Return false if the two arrays are not equal length.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3726
    cmpw(CCR0, limit, tmp0);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3727
    bne(CCR0, Ldone);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3728
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3729
    // Load array addresses.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3730
    addi(ary1, ary1, base_offset);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3731
    addi(ary2, ary2, base_offset);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3732
  } else {
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3733
    limit_needs_shift = !is_byte;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3734
    li(result, 0); // Assume not equal.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3735
  }
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3736
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3737
  // Rename registers
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3738
  Register chr1 = tmp0;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3739
  Register chr2 = tmp1;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3740
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3741
  // Compare 8 bytes per iteration in fast loop.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3742
  const int log2_chars_per_iter = is_byte ? 3 : 2;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3743
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3744
  srwi_(tmp0, limit, log2_chars_per_iter + (limit_needs_shift ? 1 : 0));
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3745
  beq(CCR0, Lskipfast);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3746
  mtctr(tmp0);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3747
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3748
  bind(Lfastloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3749
  ld(chr1, 0, ary1);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3750
  ld(chr2, 0, ary2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3751
  addi(ary1, ary1, 8);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3752
  addi(ary2, ary2, 8);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3753
  cmpd(CCR0, chr1, chr2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3754
  bne(CCR0, Ldone);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3755
  bdnz(Lfastloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3756
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3757
  bind(Lskipfast);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3758
  rldicl_(limit, limit, limit_needs_shift ? 64 - 1 : 0, 64 - log2_chars_per_iter); // Remaining characters.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3759
  beq(CCR0, Lskiploop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3760
  mtctr(limit);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3761
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3762
  // Character by character.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3763
  bind(Lloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3764
  if (is_byte) {
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3765
    lbz(chr1, 0, ary1);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3766
    lbz(chr2, 0, ary2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3767
    addi(ary1, ary1, 1);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3768
    addi(ary2, ary2, 1);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3769
  } else {
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3770
    lhz(chr1, 0, ary1);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3771
    lhz(chr2, 0, ary2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3772
    addi(ary1, ary1, 2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3773
    addi(ary2, ary2, 2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3774
  }
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3775
  cmpw(CCR0, chr1, chr2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3776
  bne(CCR0, Ldone);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3777
  bdnz(Lloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3778
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3779
  bind(Lskiploop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3780
  li(result, 1); // All characters are equal.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3781
  bind(Ldone);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3782
}
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3783
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3784
// Emit code for String.indexOf(needle) on a haystack of 'haycnt' characters.
//
// On exit 'result' holds the character index of the first match relative to 'haystack',
// or -1 if the needle does not occur.
//
// ae           - encoding pair: StrIntrinsicNode::LL, UU or UL (LU is rejected by an assert).
//                The haystack is 1 byte/char for LL and 2 bytes/char otherwise;
//                the needle is 2 bytes/char for UU and 1 byte/char otherwise.
// needlecntval - 0: needle length is only known at run time and is passed in 'needlecnt'.
//                otherwise: constant needle length (1 is rejected by a guarantee).
// needle_values is not used by this implementation.
//
// Prerequisite (must be ensured in the ideal graph): 0 < needlecnt <= haycnt.
//
// Registers written here: haycnt, tmp1, tmp2, tmp3, tmp4, R0, CTR, CCR0, CCR1, needlecnt
// (variable length, or constant length > 3) and CCR6 (variable length only).
void MacroAssembler::string_indexof(Register result, Register haystack, Register haycnt,
                                    Register needle, ciTypeArray* needle_values, Register needlecnt, int needlecntval,
                                    Register tmp1, Register tmp2, Register tmp3, Register tmp4, int ae) {

  assert(ae != StrIntrinsicNode::LU, "Invalid encoding");

  // Code generation time properties.
  const int  hay_bytes  = (ae == StrIntrinsicNode::LL) ? 1 : 2; // Bytes per haystack character.
  const int  ndl_bytes  = (ae == StrIntrinsicNode::UU) ? 2 : 1; // Bytes per needle character.
  const bool hay_wide   = (hay_bytes == 2);
  const bool ndl_wide   = (ndl_bytes == 2);
  const bool var_needle = (needlecntval == 0);                  // Needle length lives in a register.

  // Register roles.
  const Register hay_last = haycnt; // Last start address worth checking. Kills haycnt.
  const Register pos      = tmp1;   // Current haystack address.
  const Register ndl_head = tmp2;   // First 2 needle characters (1 in the short needle path).
  const Register val_a    = tmp3;   // Scratch / loaded haystack value.
  const Register val_b    = R0;     // Scratch / loaded value.
  const Register span     = tmp4;   // Bytes between 'pos' and 'hay_last'.

  Label short_needle, found, not_found, finish;
  Label outer, inner, tail_check, hit_first, hit_second;

  // ------------------------------------------------------------------------------------------------
  // Setup for the main loop. It is tuned for needles of at least 2 characters;
  // shorter (variable length) needles branch to 'short_needle'.
  // ------------------------------------------------------------------------------------------------

  clrldi(haycnt, haycnt, 32);       // Zero-extend the positive int to 64 bit.
  addi(pos, haystack, -hay_bytes);  // Start one character early, accesses pre-increment.
  if (var_needle) {
    cmpwi(CCR6, needlecnt, 2);      // CCR6 is consulted again once the first 2 characters matched.
    clrldi(needlecnt, needlecnt, 32); // Zero-extend the positive int to 64 bit.
    blt(CCR6, short_needle);
  }

  // Fetch the first 2 needle characters with a single load.
  if (ndl_wide) {
    lwz(ndl_head, 0, needle);
  } else {
    lhz(ndl_head, 0, needle);
  }

  // val_a = haycnt - needlecnt: index of the last position at which a match can start.
  if (var_needle) {
    subf(val_a, needlecnt, haycnt);
    addi(needlecnt, needlecnt, -2); // Characters still to compare after the first 2.
  } else {
    guarantee(needlecntval != 1, "IndexOf with single-character needle must be handled separately");
    assert((needlecntval & 0x7fff) == needlecntval, "wrong immediate");
    addi(val_a, haycnt, -needlecntval);
    if (needlecntval > 3) {
      li(needlecnt, needlecntval - 2); // Characters still to compare after the first 2.
    }
  }

  if (hay_wide) {
    slwi(val_a, val_a, 1);          // Character index -> byte offset.
  }

  if (ae == StrIntrinsicNode::UL) {
    // Spread the 2 needle bytes into 2 zero-extended 16 bit characters so that they can be
    // compared against 2 haystack characters at once.
    srwi(tmp4, ndl_head, 1*8);          // ___0
    rlwimi(ndl_head, tmp4, 2*8, 0, 23); // _0_1
  }

  add(hay_last, haystack, val_a);   // haystack + hay_bytes * (haycnt - needlecnt)

  // ------------------------------------------------------------------------------------------------
  // Main loop: look for the first 2 needle characters, 2 haystack positions per iteration.
  // ------------------------------------------------------------------------------------------------

  bind(outer);
  subf(span, pos, hay_last);        // Distance from the address already checked to the last one.
  addi(pos, pos, hay_bytes);        // Advance to the next candidate.
  srdi_(val_b, span, hay_bytes);    // Number of remaining positions / 2.
  beq(CCR0, tail_check);            // Fewer than 2 positions left.
  mtctr(val_b);

  bind(inner);
  // Load 2 characters at 'pos' and at 'pos' + 1 character (alignment is ignored).
  if (hay_wide) {
    lwz(val_a, 0, pos);
    lwz(val_b, 2, pos);
  } else {
    lhz(val_a, 0, pos);
    lhz(val_b, 1, pos);
  }
  // Comparing 2 characters (instead of 1) reduces the number of branches into the compare loop.
  cmpw(CCR0, val_a, ndl_head);
  cmpw(CCR1, val_b, ndl_head);
  beq(CCR0, hit_first);
  beq(CCR1, hit_second);
  addi(pos, pos, 2 * hay_bytes);
  bdnz(inner);

  bind(tail_check);
  andi_(span, span, hay_bytes);     // (Number of remaining positions) & 1.
  beq(CCR0, not_found);
  // Exactly one position has not been looked at yet.
  if (hay_wide) {
    lwz(val_a, 0, pos);
  } else {
    lhz(val_a, 0, pos);
  }
  cmpw(CCR1, val_a, ndl_head);
  beq(CCR1, hit_first);

  bind(not_found);
  li(result, -1);
  b(finish);

  // ------------------------------------------------------------------------------------------------
  // Short needle: the variable length variant may be invoked with needlecnt < 2.
  // Plain one-character-at-a-time scan over the whole haystack.
  // ------------------------------------------------------------------------------------------------
  if (var_needle) {
    Label one_char;
    bind(short_needle);
    mtctr(haycnt);
    // First needle character.
    if (ndl_wide) {
      lhz(ndl_head, 0, needle);
    } else {
      lbz(ndl_head, 0, needle);
    }
    bind(one_char);
    // Update form load: advances 'pos' by one character and loads from there.
    if (hay_wide) {
      lhzu(val_a, 2, pos);
    } else {
      lbzu(val_a, 1, pos);
    }
    cmpw(CCR1, val_a, ndl_head);
    beq(CCR1, found);
    bdnz(one_char);
    li(result, -1);                 // Not found.
    b(finish);
  }

  // ------------------------------------------------------------------------------------------------
  // First 2 characters matched at 'pos': verify the remaining needle characters.
  // A mismatch resumes the search at 'outer'.
  // ------------------------------------------------------------------------------------------------

  bind(hit_second);
  addi(pos, pos, hay_bytes);        // The match was at the 2nd of the 2 inspected positions.
  bind(hit_first);                  // 'pos' is the candidate needle start.

  if (needlecntval == 3) {
    // Constant length 3: a single character remains, no loop needed.
    if (ndl_wide) {
      lhz(val_b, 2 * 2, needle);
    } else {
      lbz(val_b, 2 * 1, needle);
    }
    if (hay_wide) {
      lhz(val_a, 2 * 2, pos);
    } else {
      lbz(val_a, 2 * 1, pos);
    }
    cmpw(CCR1, val_a, val_b);
    bne(CCR1, outer);
  } else if (needlecntval != 2) {   // Constant length 2 has nothing left to compare.
    if (var_needle) {
      beq(CCR6, found);             // Variable needlecnt == 2: nothing left to compare.
    }
    const Register ndl_off = tmp4;  // Byte offset into the needle.
    // For UL the haystack offset is twice the needle offset and is recomputed in val_a
    // on every iteration; otherwise both strings share the same offset register.
    const Register hay_off = (ae == StrIntrinsicNode::UL) ? val_a : ndl_off;

    li(ndl_off, 2 * ndl_bytes);     // Characters 0 and 1 are done, continue with character 2.
    mtctr(needlecnt);               // Already reduced by 2, still > 0.

    Label compare;
    bind(compare);
    if (ae == StrIntrinsicNode::UL) {
      sldi(hay_off, ndl_off, 1);
    }
    if (ndl_wide) {
      lhzx(val_b, needle, ndl_off);
    } else {
      lbzx(val_b, needle, ndl_off);
    }
    if (hay_wide) {
      lhzx(val_a, pos, hay_off);
    } else {
      lbzx(val_a, pos, hay_off);
    }
    cmpw(CCR1, val_a, val_b);
    bne(CCR1, outer);
    addi(ndl_off, ndl_off, ndl_bytes);
    bdnz(compare);
  }

  // Convert the match address into a character index.
  bind(found);
  subf(result, haystack, pos);      // Byte offset relative to haystack ...
  if (hay_wide) {
    srdi(result, result, 1);        // ... scaled to characters.
  }
  bind(finish);
} // string_indexof
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3924
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3925
// Emit code that searches 'haystack' (haycnt characters) for a single character.
//
// On exit 'result' holds the character index of the first occurrence relative to
// 'haystack', or -1 if the character does not occur.
//
// needle     - register holding the character to look for. If R0 is passed,
//              the constant 'needleChar' is compared as an immediate instead.
// needleChar - constant character, only used when needle == R0.
// is_byte    - true: haystack has 1 byte per character, false: 2 bytes per character.
//
// Registers written here: tmp1, tmp2, R0, CTR, CCR0, CCR1.
void MacroAssembler::string_indexof_char(Register result, Register haystack, Register haycnt,
                                         Register needle, jchar needleChar, Register tmp1, Register tmp2, bool is_byte) {
  assert_different_registers(haystack, haycnt, needle, tmp1, tmp2);

  const Register pos    = tmp1; // Current haystack address.
  const Register first  = tmp2; // Character at 'pos'.
  const Register second = R0;   // Character following 'pos'.

  const int          char_bytes    = is_byte ? 1 : 2;
  const bool         needle_in_reg = (needle != R0);
  const unsigned int needle_imm    = (unsigned int)needleChar;

  Label loop, tail, hit_first, hit_second, miss, done;

  // Number of 2x unrolled iterations = haycnt / 2.
  srwi_(tmp2, haycnt, 1);
  mr(pos, haystack);
  beq(CCR0, tail);              // Fewer than 2 characters: skip the unrolled loop.
  mtctr(tmp2);

  // Main work horse: inspect 2 characters per iteration.
  bind(loop);
  if (is_byte) {
    lbz(first,  0, pos);
    lbz(second, 1, pos);
  } else {
    lhz(first,  0, pos);
    lhz(second, 2, pos);
  }
  if (needle_in_reg) {
    cmpw(CCR0, first, needle);
  } else {
    cmplwi(CCR0, first, needle_imm);
  }
  if (needle_in_reg) {
    cmpw(CCR1, second, needle);
  } else {
    cmplwi(CCR1, second, needle_imm);
  }
  beq(CCR0, hit_first);
  beq(CCR1, hit_second);
  addi(pos, pos, 2 * char_bytes);
  bdnz(loop);

  // Odd haycnt leaves one character the unrolled loop did not cover.
  bind(tail);
  andi_(R0, haycnt, 1);
  beq(CCR0, miss);
  if (is_byte) {
    lbz(first, 0, pos);
  } else {
    lhz(first, 0, pos);
  }
  if (needle_in_reg) {
    cmpw(CCR1, first, needle);
  } else {
    cmplwi(CCR1, first, needle_imm);
  }
  beq(CCR1, hit_first);

  bind(miss);
  li(result, -1);               // Not found.
  b(done);

  bind(hit_second);
  addi(pos, pos, char_bytes);   // The match was the 2nd character of the pair.

  bind(hit_first);
  subf(result, haystack, pos);  // Byte offset relative to haystack ...
  if (!is_byte) {
    srdi(result, result, 1);    // ... scaled to characters.
  }
  bind(done);
} // string_indexof_char
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3976
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3977
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3978
// Emits code that scans the cnt bytes starting at src for a byte whose most
// significant bit (0x80) is set.
//   result: set to 1 if such a byte was seen, 0 otherwise.
//   src:    advanced while scanning (clobbered).
//   cnt:    byte count; only read. The chunk count is derived with a word
//           shift, so presumably only the low 32 bits are significant.
//   tmp1, tmp2, R0 (tmp0), CCR0 and CTR are used as scratch.
void MacroAssembler::has_negatives(Register src, Register cnt, Register result,
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3979
                                   Register tmp1, Register tmp2) {
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3980
  const Register tmp0 = R0;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3981
  assert_different_registers(src, result, cnt, tmp0, tmp1, tmp2);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3982
  Label Lfastloop, Lslow, Lloop, Lnoneg, Ldone;
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3983
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3984
  // Check if cnt >= 16, i.e. there is at least one 16-byte chunk for the fast loop.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3985
  lis(tmp1, (int)(short)0x8080);  // tmp1 = 0x8080808080808080
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3986
  // tmp2 = cnt / 16 = number of 16-byte chunks; the result of this shift is tested by the beq below.
  srwi_(tmp2, cnt, 4);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3987
  li(result, 1);                  // Assume there's a negative byte.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3988
  beq(CCR0, Lslow);               // No full 16-byte chunk: go straight to the byte loop.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3989
  // Complete the mask started by lis above (see the tmp1 comment there).
  ori(tmp1, tmp1, 0x8080);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3990
  rldimi(tmp1, tmp1, 32, 0);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3991
  mtctr(tmp2);                    // Loop count = number of 16-byte chunks.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3992
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3993
  // 2x unrolled loop: tests two doublewords (16 bytes) per iteration.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3994
  bind(Lfastloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3995
  ld(tmp2, 0, src);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3996
  ld(tmp0, 8, src);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3997
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3998
  // OR both doublewords so a single mask test covers all 16 bytes.
  orr(tmp0, tmp2, tmp0);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  3999
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4000
  // Keep only the 0x80 bit of every byte; non-zero means some byte is negative.
  and_(tmp0, tmp0, tmp1);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4001
  bne(CCR0, Ldone);               // Found negative byte.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4002
  addi(src, src, 16);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4003
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4004
  bdnz(Lfastloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4005
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4006
  bind(Lslow);                    // Fallback to slow version
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4007
  // tmp0 = cnt & 15 = bytes left after the 16-byte chunks.
  rldicl_(tmp0, cnt, 0, 64-4);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4008
  beq(CCR0, Lnoneg);              // Nothing left to check.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4009
  mtctr(tmp0);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4010
  // Byte-wise loop over the remaining (at most 15) bytes.
  bind(Lloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4011
  lbz(tmp0, 0, src);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4012
  addi(src, src, 1);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4013
  andi_(tmp0, tmp0, 0x80);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4014
  bne(CCR0, Ldone);               // Found negative byte.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4015
  bdnz(Lloop);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4016
  bind(Lnoneg);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4017
  li(result, 0);                  // All bytes checked, none negative.
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4018
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4019
  bind(Ldone);
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4020
}
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4021
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4022
#endif // Compiler2
6241574f5982 8149655: PPC64: Implement CompactString intrinsics
mdoerr
parents: 35913
diff changeset
  4023
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4024
// Helpers for Intrinsic Emitters
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4025
//
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4026
// Revert the byte order of a 32bit value in a register
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4027
//   src: 0x44556677
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4028
//   dst: 0x77665544
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4029
// Three steps to obtain the result:
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4030
//  1) Rotate src (as doubleword) left 5 bytes. That puts the leftmost byte of the src word
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4031
//     into the rightmost byte position. Afterwards, everything left of the rightmost byte is cleared.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4032
//     This value initializes dst.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4033
//  2) Rotate src (as word) left 3 bytes. That puts the rightmost byte of the src word into the leftmost
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4034
//     byte position. Furthermore, byte 5 is rotated into byte 6 position where it is supposed to go.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4035
//     This value is mask inserted into dst with a [0..23] mask of 1s.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4036
//  3) Rotate src (as word) left 1 byte. That puts byte 6 into byte 5 position.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4037
//     This value is mask inserted into dst with a [8..15] mask of 1s.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4038
void MacroAssembler::load_reverse_32(Register dst, Register src) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4039
  // dst is assembled in three steps while src is still being read, so the two must not alias.
  assert_different_registers(dst, src);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4040
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4041
  rldicl(dst, src, (4+1)*8, 56);       // Rotate byte 4 into position 7 (rightmost), clear all to the left.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4042
  rlwimi(dst, src,     3*8,  0, 23);   // Insert byte 5 into position 6, 7 into 4, leave pos 7 alone.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4043
  rlwimi(dst, src,     1*8,  8, 15);   // Insert byte 6 into position 5, leave the rest alone.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4044
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4045
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4046
// Calculate the column addresses of the crc32 lookup table into distinct registers.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4047
// This loop-invariant calculation is moved out of the loop body, reducing the loop
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4048
// body size from 20 to 16 instructions.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4049
// Returns the offset that was used to calculate the address of column tc3.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4050
// Due to register shortage, setting tc3 may overwrite table. With the return offset
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4051
// at hand, the original table address can be easily reconstructed.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4052
int MacroAssembler::crc32_table_columns(Register table, Register tc0, Register tc1, Register tc2, Register tc3) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4053
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4054
#ifdef VM_LITTLE_ENDIAN
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4055
  // This is what we implement (the DOLIT4 part):
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4056
  // ========================================================================= */
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4057
  // #define DOLIT4 c ^= *buf4++; \
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4058
  //         c = crc_table[3][c & 0xff] ^ crc_table[2][(c >> 8) & 0xff] ^ \
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4059
  //             crc_table[1][(c >> 16) & 0xff] ^ crc_table[0][c >> 24]
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4060
  // #define DOLIT32 DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4; DOLIT4
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4061
  // ========================================================================= */
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4062
  // Byte offsets of table columns 3, 2, 1, 0 (in that order), matching DOLIT4 above.
  const int ix0 = 3*(4*CRC32_COLUMN_SIZE);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4063
  const int ix1 = 2*(4*CRC32_COLUMN_SIZE);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4064
  const int ix2 = 1*(4*CRC32_COLUMN_SIZE);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4065
  const int ix3 = 0*(4*CRC32_COLUMN_SIZE);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4066
#else
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4067
  // This is what we implement (the DOBIG4 part):
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4068
  // =========================================================================
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4069
  // #define DOBIG4 c ^= *++buf4; \
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4070
  //         c = crc_table[4][c & 0xff] ^ crc_table[5][(c >> 8) & 0xff] ^ \
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4071
  //             crc_table[6][(c >> 16) & 0xff] ^ crc_table[7][c >> 24]
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4072
  // #define DOBIG32 DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4; DOBIG4
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4073
  // =========================================================================
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4074
  // Byte offsets of table columns 4, 5, 6, 7 (in that order), matching DOBIG4 above.
  const int ix0 = 4*(4*CRC32_COLUMN_SIZE);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4075
  const int ix1 = 5*(4*CRC32_COLUMN_SIZE);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4076
  const int ix2 = 6*(4*CRC32_COLUMN_SIZE);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4077
  const int ix3 = 7*(4*CRC32_COLUMN_SIZE);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4078
#endif
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4079
  assert_different_registers(table, tc0, tc1, tc2);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4080
  // tc3 shares its register with table, which is why tc3 is written last below.
  assert(table == tc3, "must be!");
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4081
35541
cba047a086d5 8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents: 35085
diff changeset
  4082
  addi(tc0, table, ix0);
cba047a086d5 8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents: 35085
diff changeset
  4083
  addi(tc1, table, ix1);
cba047a086d5 8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents: 35085
diff changeset
  4084
  addi(tc2, table, ix2);
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4085
  // Overwrites table (== tc3). Skipped when the offset is 0 (the little-endian case above).
  if (ix3 != 0) addi(tc3, table, ix3);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4086
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4087
  // Offset that was added to table; the caller can subtract it to get the table base back.
  return ix3;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4088
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4089
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4090
/**
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4091
 * uint32_t crc;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4092
 * crc = timesXtoThe32[val & 0xFF] ^ (crc >> 8);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4093
 */
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4094
void MacroAssembler::fold_byte_crc32(Register crc, Register val, Register table, Register tmp) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4095
  assert_different_registers(crc, table, tmp);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4096
  assert_different_registers(val, table);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4097
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4098
  // Both branches emit the same two instructions; only their order differs.
  // val may alias crc (then the index must be extracted before crc is shifted)
  // or tmp (see update_byte_crc32), but never table.
  if (crc == val) {                   // Must rotate first to use the unmodified value.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4099
    rlwinm(tmp, val, 2, 24-2, 31-2);  // Insert (rightmost) byte 7 of val, shifted left by 2, into byte 6..7 of tmp, clear the rest.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4100
                                      // As we use a word (4-byte) instruction, we have to adapt the mask bit positions.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4101
    srwi(crc, crc, 8);                // Unsigned shift, clear leftmost 8 bits.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4102
  } else {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4103
    srwi(crc, crc, 8);                // Unsigned shift, clear leftmost 8 bits.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4104
    rlwinm(tmp, val, 2, 24-2, 31-2);  // Insert (rightmost) byte 7 of val, shifted left by 2, into byte 6..7 of tmp, clear the rest.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4105
  }
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4106
  lwzx(tmp, table, tmp);              // tmp = 4-byte table entry at byte offset (val & 0xFF) * 4.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4107
  xorr(crc, crc, tmp);                // crc = (crc >> 8) ^ table entry.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4108
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4109
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4110
/**
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4111
 * uint32_t crc;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4112
 * crc = timesXtoThe32[crc & 0xFF] ^ (crc >> 8);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4113
 */
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4114
void MacroAssembler::fold_8bit_crc32(Register crc, Register table, Register tmp) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4115
  // crc is passed as both crc and val, so the table index is the low byte of crc itself.
  fold_byte_crc32(crc, crc, table, tmp);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4116
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4117
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4118
/**
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4119
 * Emits code to update CRC-32 with a byte value according to constants in table.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4120
 *
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4121
 * @param [in,out]crc   Register containing the crc.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4122
 * @param [in]val       Register containing the byte to fold into the CRC.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4123
 * @param [in]table     Register containing the table of crc constants.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4124
 *
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4125
 * uint32_t crc;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4126
 * val = crc_table[(val ^ crc) & 0xFF];
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4127
 * crc = val ^ (crc >> 8);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4128
 */
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4129
void MacroAssembler::update_byte_crc32(Register crc, Register val, Register table) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4130
  BLOCK_COMMENT("update_byte_crc32:");
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4131
  xorr(val, val, crc);                    // val ^= crc; only its low byte is used as table index below.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4132
  fold_byte_crc32(crc, val, table, val);  // val doubles as the temp register, so it is clobbered.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4133
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4134
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4135
/**
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4136
 * @param crc   register containing existing CRC (32-bit)
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4137
 * @param buf   register pointing to input byte buffer (byte*)
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4138
 * @param len   register containing number of bytes
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4139
 * @param table register pointing to CRC table
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4140
 */
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4141
void MacroAssembler::update_byteLoop_crc32(Register crc, Register buf, Register len, Register table,
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4142
                                           Register data, bool loopAlignment) {
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4143
  assert_different_registers(crc, buf, len, table, data);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4144
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4145
  Label L_mainLoop, L_done;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4146
  const int mainLoop_stepping  = 1;  // Bytes consumed per loop iteration.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4147
  // Code alignment requested for the loop head: 32 if loopAlignment is set, otherwise 4.
  const int mainLoop_alignment = loopAlignment ? 32 : 4; // (InputForNewCode > 4 ? InputForNewCode : 32) : 4;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4148
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4149
  // Process all bytes in a single-byte loop.
35541
cba047a086d5 8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents: 35085
diff changeset
  4150
  clrldi_(len, len, 32);                         // Enforce 32 bit. Anything to do?
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4151
  beq(CCR0, L_done);                             // len == 0: emit no loop iterations.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4152
35541
cba047a086d5 8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents: 35085
diff changeset
  4153
  mtctr(len);                                    // Loop count = number of bytes.
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4154
  align(mainLoop_alignment);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4155
  BIND(L_mainLoop);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4156
    lbz(data, 0, buf);                           // Byte from buffer, zero-extended.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4157
    addi(buf, buf, mainLoop_stepping);           // Advance buffer position.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4158
    update_byte_crc32(crc, data, table);         // Fold the byte into crc; data is clobbered.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4159
    bdnz(L_mainLoop);                            // Iterate.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4160
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4161
  bind(L_done);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4162
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4163
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4164
/**
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4165
 * Emits code to update CRC-32 with a 4-byte value according to constants in table
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4166
 * Implementation according to jdk/src/share/native/java/util/zip/zlib-1.2.8/crc32.c
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4167
 */
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4168
// A note on the lookup table address(es):
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4169
// The lookup table consists of two sets of four columns each.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4170
// The columns {0..3} are used for little-endian machines.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4171
// The columns {4..7} are used for big-endian machines.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4172
// To save the effort of adding the column offset to the table address each time
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4173
// a table element is looked up, it is possible to pass the pre-calculated
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4174
// column addresses.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4175
// Uses R9..R12 as work register. Must be saved/restored by caller, if necessary.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4176
void MacroAssembler::update_1word_crc32(Register crc, Register buf, Register table, int bufDisp, int bufInc,
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4177
                                        Register t0,  Register t1,  Register t2,  Register t3,
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4178
                                        Register tc0, Register tc1, Register tc2, Register tc3) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4179
  // t3 receives the loaded word before crc is xor-ed in, so it must not be crc.
  assert_different_registers(crc, t3);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4180
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4181
  // XOR crc with next four bytes of buffer.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4182
  lwz(t3, bufDisp, buf);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4183
  if (bufInc != 0) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4184
    addi(buf, buf, bufInc);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4185
  }
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4186
  xorr(t3, t3, crc);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4187
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4188
  // Chop crc into 4 single-byte pieces, shifted left 2 bits, to form the table indices.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4189
  rlwinm(t0, t3,  2,         24-2, 31-2);  // ((t3 >>  0) & 0xff) << 2
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4190
  rlwinm(t1, t3,  32+(2- 8), 24-2, 31-2);  // ((t3 >>  8) & 0xff) << 2
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4191
  rlwinm(t2, t3,  32+(2-16), 24-2, 31-2);  // ((t3 >> 16) & 0xff) << 2
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4192
  rlwinm(t3, t3,  32+(2-24), 24-2, 31-2);  // ((t3 >> 24) & 0xff) << 2; t3 is overwritten last.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4193
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4194
  // Use the pre-calculated column addresses.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4195
  // Load pre-calculated table values.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4196
  lwzx(t0, tc0, t0);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4197
  lwzx(t1, tc1, t1);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4198
  lwzx(t2, tc2, t2);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4199
  lwzx(t3, tc3, t3);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4200
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4201
  // Calculate new crc from table values.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4202
  xorr(t0,  t0, t1);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4203
  xorr(t2,  t2, t3);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4204
  xorr(crc, t0, t2);  // Now crc contains the final checksum value.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4205
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4206
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4207
/**
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4208
 * @param crc   register containing existing CRC (32-bit)
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4209
 * @param buf   register pointing to input byte buffer (byte*)
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4210
 * @param len   register containing number of bytes
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4211
 * @param table register pointing to CRC table
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4212
 *
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4213
 * Uses R9..R12 as work register. Must be saved/restored by caller!
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4214
 */
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4215
void MacroAssembler::kernel_crc32_2word(Register crc, Register buf, Register len, Register table,
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4216
                                        Register t0,  Register t1,  Register t2,  Register t3,
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4217
                                        Register tc0, Register tc1, Register tc2, Register tc3,
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4218
                                        bool invertCRC) {
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4219
  assert_different_registers(crc, buf, len, table);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4220
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4221
  Label L_mainLoop, L_tail;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4222
  Register  tmp  = t0;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4223
  Register  data = t0;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4224
  Register  tmp2 = t1;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4225
  const int mainLoop_stepping  = 8;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4226
  const int tailLoop_stepping  = 1;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4227
  const int log_stepping       = exact_log2(mainLoop_stepping);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4228
  const int mainLoop_alignment = 32; // InputForNewCode > 4 ? InputForNewCode : 32;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4229
  const int complexThreshold   = 2*mainLoop_stepping;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4230
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4231
  // Don't test for len <= 0 here. This pathological case should not occur anyway.
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4232
  // Optimizing for it by adding a test and a branch seems to be a waste of CPU cycles
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4233
  // for all well-behaved cases. The situation itself is detected and handled correctly
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4234
  // within update_byteLoop_crc32.
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4235
  assert(tailLoop_stepping == 1, "check tailLoop_stepping!");
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4236
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4237
  BLOCK_COMMENT("kernel_crc32_2word {");
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4238
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4239
  if (invertCRC) {
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4240
    nand(crc, crc, crc);                      // 1s complement of crc
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4241
  }
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4242
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4243
  // Check for short (<mainLoop_stepping) buffer.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4244
  cmpdi(CCR0, len, complexThreshold);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4245
  blt(CCR0, L_tail);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4246
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4247
  // Pre-mainLoop alignment did show a slight (1%) positive effect on performance.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4248
  // We leave the code in for reference. Maybe we need alignment when we exploit vector instructions.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4249
  {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4250
    // Align buf addr to mainLoop_stepping boundary.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4251
    neg(tmp2, buf);                           // Calculate # preLoop iterations for alignment.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4252
    rldicl(tmp2, tmp2, 0, 64-log_stepping);   // Rotate tmp2 0 bits, insert into tmp2, anding with mask with 1s from 62..63.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4253
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4254
    if (complexThreshold > mainLoop_stepping) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4255
      sub(len, len, tmp2);                       // Remaining bytes for main loop (>=mainLoop_stepping is guaranteed).
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4256
    } else {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4257
      sub(tmp, len, tmp2);                       // Remaining bytes for main loop.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4258
      cmpdi(CCR0, tmp, mainLoop_stepping);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4259
      blt(CCR0, L_tail);                         // For less than one mainloop_stepping left, do only tail processing
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4260
      mr(len, tmp);                              // remaining bytes for main loop (>=mainLoop_stepping is guaranteed).
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4261
    }
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4262
    update_byteLoop_crc32(crc, buf, tmp2, table, data, false);
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4263
  }
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4264
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4265
  srdi(tmp2, len, log_stepping);                 // #iterations for mainLoop
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4266
  andi(len, len, mainLoop_stepping-1);           // remaining bytes for tailLoop
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4267
  mtctr(tmp2);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4268
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4269
#ifdef VM_LITTLE_ENDIAN
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4270
  Register crc_rv = crc;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4271
#else
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4272
  Register crc_rv = tmp;                         // Load_reverse needs separate registers to work on.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4273
                                                 // Occupies tmp, but frees up crc.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4274
  load_reverse_32(crc_rv, crc);                  // Revert byte order because we are dealing with big-endian data.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4275
  tmp = crc;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4276
#endif
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4277
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4278
  int reconstructTableOffset = crc32_table_columns(table, tc0, tc1, tc2, tc3);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4279
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4280
  align(mainLoop_alignment);                     // Octoword-aligned loop address. Shows 2% improvement.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4281
  BIND(L_mainLoop);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4282
    update_1word_crc32(crc_rv, buf, table, 0, 0, crc_rv, t1, t2, t3, tc0, tc1, tc2, tc3);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4283
    update_1word_crc32(crc_rv, buf, table, 4, mainLoop_stepping, crc_rv, t1, t2, t3, tc0, tc1, tc2, tc3);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4284
    bdnz(L_mainLoop);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4285
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4286
#ifndef VM_LITTLE_ENDIAN
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4287
  load_reverse_32(crc, crc_rv);                  // Revert byte order because we are dealing with big-endian data.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4288
  tmp = crc_rv;                                  // Tmp uses it's original register again.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4289
#endif
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4290
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4291
  // Restore original table address for tailLoop.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4292
  if (reconstructTableOffset != 0) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4293
    addi(table, table, -reconstructTableOffset);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4294
  }
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4295
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4296
  // Process last few (<complexThreshold) bytes of buffer.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4297
  BIND(L_tail);
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4298
  update_byteLoop_crc32(crc, buf, len, table, data, false);
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4299
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4300
  if (invertCRC) {
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4301
    nand(crc, crc, crc);                      // 1s complement of crc
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4302
  }
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4303
  BLOCK_COMMENT("} kernel_crc32_2word");
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4304
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4305
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4306
/**
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4307
 * @param crc   register containing existing CRC (32-bit)
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4308
 * @param buf   register pointing to input byte buffer (byte*)
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4309
 * @param len   register containing number of bytes
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4310
 * @param table register pointing to CRC table
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4311
 *
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4312
 * uses R9..R12 as work register. Must be saved/restored by caller!
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4313
 */
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4314
void MacroAssembler::kernel_crc32_1word(Register crc, Register buf, Register len, Register table,
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4315
                                        Register t0,  Register t1,  Register t2,  Register t3,
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4316
                                        Register tc0, Register tc1, Register tc2, Register tc3,
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4317
                                        bool invertCRC) {
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4318
  assert_different_registers(crc, buf, len, table);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4319
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4320
  Label L_mainLoop, L_tail;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4321
  Register  tmp          = t0;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4322
  Register  data         = t0;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4323
  Register  tmp2         = t1;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4324
  const int mainLoop_stepping  = 4;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4325
  const int tailLoop_stepping  = 1;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4326
  const int log_stepping       = exact_log2(mainLoop_stepping);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4327
  const int mainLoop_alignment = 32; // InputForNewCode > 4 ? InputForNewCode : 32;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4328
  const int complexThreshold   = 2*mainLoop_stepping;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4329
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4330
  // Don't test for len <= 0 here. This pathological case should not occur anyway.
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4331
  // Optimizing for it by adding a test and a branch seems to be a waste of CPU cycles
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4332
  // for all well-behaved cases. The situation itself is detected and handled correctly
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4333
  // within update_byteLoop_crc32.
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4334
  assert(tailLoop_stepping == 1, "check tailLoop_stepping!");
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4335
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4336
  BLOCK_COMMENT("kernel_crc32_1word {");
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4337
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4338
  if (invertCRC) {
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4339
    nand(crc, crc, crc);                      // 1s complement of crc
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4340
  }
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4341
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4342
  // Check for short (<mainLoop_stepping) buffer.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4343
  cmpdi(CCR0, len, complexThreshold);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4344
  blt(CCR0, L_tail);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4345
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4346
  // Pre-mainLoop alignment did show a slight (1%) positive effect on performance.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4347
  // We leave the code in for reference. Maybe we need alignment when we exploit vector instructions.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4348
  {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4349
    // Align buf addr to mainLoop_stepping boundary.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4350
    neg(tmp2, buf);                              // Calculate # preLoop iterations for alignment.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4351
    rldicl(tmp2, tmp2, 0, 64-log_stepping);      // Rotate tmp2 0 bits, insert into tmp2, anding with mask with 1s from 62..63.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4352
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4353
    if (complexThreshold > mainLoop_stepping) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4354
      sub(len, len, tmp2);                       // Remaining bytes for main loop (>=mainLoop_stepping is guaranteed).
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4355
    } else {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4356
      sub(tmp, len, tmp2);                       // Remaining bytes for main loop.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4357
      cmpdi(CCR0, tmp, mainLoop_stepping);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4358
      blt(CCR0, L_tail);                         // For less than one mainloop_stepping left, do only tail processing
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4359
      mr(len, tmp);                              // remaining bytes for main loop (>=mainLoop_stepping is guaranteed).
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4360
    }
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4361
    update_byteLoop_crc32(crc, buf, tmp2, table, data, false);
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4362
  }
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4363
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4364
  srdi(tmp2, len, log_stepping);                 // #iterations for mainLoop
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4365
  andi(len, len, mainLoop_stepping-1);           // remaining bytes for tailLoop
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4366
  mtctr(tmp2);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4367
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4368
#ifdef VM_LITTLE_ENDIAN
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4369
  Register crc_rv = crc;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4370
#else
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4371
  Register crc_rv = tmp;                         // Load_reverse needs separate registers to work on.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4372
                                                 // Occupies tmp, but frees up crc.
35541
cba047a086d5 8146613: PPC64: C2 does no longer respect int to long conversion for stub calls
mdoerr
parents: 35085
diff changeset
  4373
  load_reverse_32(crc_rv, crc);                  // Revert byte order because we are dealing with big-endian data.
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4374
  tmp = crc;
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4375
#endif
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4376
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4377
  int reconstructTableOffset = crc32_table_columns(table, tc0, tc1, tc2, tc3);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4378
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4379
  align(mainLoop_alignment);                     // Octoword-aligned loop address. Shows 2% improvement.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4380
  BIND(L_mainLoop);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4381
    update_1word_crc32(crc_rv, buf, table, 0, mainLoop_stepping, crc_rv, t1, t2, t3, tc0, tc1, tc2, tc3);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4382
    bdnz(L_mainLoop);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4383
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4384
#ifndef VM_LITTLE_ENDIAN
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4385
  load_reverse_32(crc, crc_rv);                  // Revert byte order because we are dealing with big-endian data.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4386
  tmp = crc_rv;                                  // Tmp uses it's original register again.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4387
#endif
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4388
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4389
  // Restore original table address for tailLoop.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4390
  if (reconstructTableOffset != 0) {
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4391
    addi(table, table, -reconstructTableOffset);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4392
  }
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4393
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4394
  // Process last few (<complexThreshold) bytes of buffer.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4395
  BIND(L_tail);
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4396
  update_byteLoop_crc32(crc, buf, len, table, data, false);
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4397
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4398
  if (invertCRC) {
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4399
    nand(crc, crc, crc);                      // 1s complement of crc
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4400
  }
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4401
  BLOCK_COMMENT("} kernel_crc32_1word");
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4402
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4403
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4404
/**
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4405
 * @param crc   register containing existing CRC (32-bit)
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4406
 * @param buf   register pointing to input byte buffer (byte*)
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4407
 * @param len   register containing number of bytes
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4408
 * @param table register pointing to CRC table
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4409
 *
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4410
 * Uses R7_ARG5, R8_ARG6 as work registers.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4411
 */
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4412
void MacroAssembler::kernel_crc32_1byte(Register crc, Register buf, Register len, Register table,
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4413
                                        Register t0,  Register t1,  Register t2,  Register t3,
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4414
                                        bool invertCRC) {
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4415
  assert_different_registers(crc, buf, len, table);
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4416
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4417
  Register  data = t0;                   // Holds the current byte to be folded into crc.
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4418
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4419
  BLOCK_COMMENT("kernel_crc32_1byte {");
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4420
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4421
  if (invertCRC) {
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4422
    nand(crc, crc, crc);                      // 1s complement of crc
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4423
  }
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4424
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4425
  // Process all bytes in a single-byte loop.
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4426
  update_byteLoop_crc32(crc, buf, len, table, data, true);
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4427
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4428
  if (invertCRC) {
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4429
    nand(crc, crc, crc);                      // 1s complement of crc
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4430
  }
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4431
  BLOCK_COMMENT("} kernel_crc32_1byte");
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4432
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  4433
41334
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4434
/**
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4435
 * @param crc             register containing existing CRC (32-bit)
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4436
 * @param buf             register pointing to input byte buffer (byte*)
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4437
 * @param len             register containing number of bytes
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4438
 * @param table           register pointing to CRC table
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4439
 * @param constants       register pointing to CRC table for 128-bit aligned memory
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4440
 * @param barretConstants register pointing to table for barrett reduction
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4441
 * @param t0              volatile register
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4442
 * @param t1              volatile register
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4443
 * @param t2              volatile register
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4444
 * @param t3              volatile register
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4445
 */
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4446
void MacroAssembler::kernel_crc32_1word_vpmsumd(Register crc, Register buf, Register len, Register table,
42068
18c8a4d5998e 8168083: PPC64: Cleanup template interpreter after 8154580 and 8154867
mdoerr
parents: 41334
diff changeset
  4447
                                                Register constants,  Register barretConstants,
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4448
                                                Register t0,  Register t1, Register t2, Register t3, Register t4,
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4449
                                                bool invertCRC) {
41334
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4450
  assert_different_registers(crc, buf, len, table);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4451
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4452
  Label L_alignedHead, L_tail, L_alignTail, L_start, L_end;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4453
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4454
  Register  prealign     = t0;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4455
  Register  postalign    = t0;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4456
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4457
  BLOCK_COMMENT("kernel_crc32_1word_vpmsumb {");
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4458
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4459
  // 1. use kernel_crc32_1word for shorter than 384bit
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4460
  clrldi(len, len, 32);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4461
  cmpdi(CCR0, len, 384);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4462
  bge(CCR0, L_start);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4463
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4464
    Register tc0 = t4;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4465
    Register tc1 = constants;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4466
    Register tc2 = barretConstants;
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4467
    kernel_crc32_1word(crc, buf, len, table,t0, t1, t2, t3, tc0, tc1, tc2, table, invertCRC);
41334
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4468
    b(L_end);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4469
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4470
  BIND(L_start);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4471
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4472
    // 2. ~c
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4473
    if (invertCRC) {
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4474
      nand(crc, crc, crc);                      // 1s complement of crc
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4475
    }
41334
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4476
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4477
    // 3. calculate from 0 to first 128bit-aligned address
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4478
    clrldi_(prealign, buf, 57);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4479
    beq(CCR0, L_alignedHead);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4480
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4481
    subfic(prealign, prealign, 128);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4482
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4483
    subf(len, prealign, len);
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4484
    update_byteLoop_crc32(crc, buf, prealign, table, t2, false);
41334
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4485
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4486
    // 4. calculate from first 128bit-aligned address to last 128bit-aligned address
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4487
    BIND(L_alignedHead);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4488
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4489
    clrldi(postalign, len, 57);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4490
    subf(len, postalign, len);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4491
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4492
    // len must be more than 256bit
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4493
    kernel_crc32_1word_aligned(crc, buf, len, constants, barretConstants, t1, t2, t3);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4494
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4495
    // 5. calculate remaining
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4496
    cmpdi(CCR0, postalign, 0);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4497
    beq(CCR0, L_tail);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4498
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4499
    update_byteLoop_crc32(crc, buf, postalign, table, t2, false);
41334
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4500
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4501
    BIND(L_tail);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4502
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4503
    // 6. ~c
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4504
    if (invertCRC) {
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4505
      nand(crc, crc, crc);                      // 1s complement of crc
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4506
    }
41334
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4507
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4508
  BIND(L_end);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4509
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4510
  BLOCK_COMMENT("} kernel_crc32_1word_vpmsumb");
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4511
}
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4512
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4513
/**
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4514
 * @param crc             register containing existing CRC (32-bit)
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4515
 * @param buf             register pointing to input byte buffer (byte*)
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4516
 * @param len             register containing number of bytes
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4517
 * @param constants       register pointing to CRC table for 128-bit aligned memory
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4518
 * @param barretConstants register pointing to table for barrett reduction
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4519
 * @param t0              volatile register
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4520
 * @param t1              volatile register
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4521
 * @param t2              volatile register
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4522
 */
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4523
void MacroAssembler::kernel_crc32_1word_aligned(Register crc, Register buf, Register len,
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4524
    Register constants, Register barretConstants, Register t0, Register t1, Register t2) {
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4525
  Label L_mainLoop, L_tail, L_alignTail, L_barrett_reduction, L_end, L_first_warm_up_done, L_first_cool_down, L_second_cool_down, L_XOR, L_test;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4526
  Label L_lv0, L_lv1, L_lv2, L_lv3, L_lv4, L_lv5, L_lv6, L_lv7, L_lv8, L_lv9, L_lv10, L_lv11, L_lv12, L_lv13, L_lv14, L_lv15;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4527
  Label L_1, L_2, L_3, L_4;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4528
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4529
  Register  rLoaded      = t0;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4530
  Register  rTmp1        = t1;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4531
  Register  rTmp2        = t2;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4532
  Register  off16        = R22;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4533
  Register  off32        = R23;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4534
  Register  off48        = R24;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4535
  Register  off64        = R25;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4536
  Register  off80        = R26;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4537
  Register  off96        = R27;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4538
  Register  off112       = R28;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4539
  Register  rIdx         = R29;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4540
  Register  rMax         = R30;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4541
  Register  constantsPos = R31;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4542
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4543
  VectorRegister mask_32bit = VR24;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4544
  VectorRegister mask_64bit = VR25;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4545
  VectorRegister zeroes     = VR26;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4546
  VectorRegister const1     = VR27;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4547
  VectorRegister const2     = VR28;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4548
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4549
  // Save non-volatile vector registers (frameless).
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4550
  Register offset = t1;   int offsetInt = 0;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4551
  offsetInt -= 16; li(offset, -16);           stvx(VR20, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4552
  offsetInt -= 16; addi(offset, offset, -16); stvx(VR21, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4553
  offsetInt -= 16; addi(offset, offset, -16); stvx(VR22, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4554
  offsetInt -= 16; addi(offset, offset, -16); stvx(VR23, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4555
  offsetInt -= 16; addi(offset, offset, -16); stvx(VR24, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4556
  offsetInt -= 16; addi(offset, offset, -16); stvx(VR25, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4557
  offsetInt -= 16; addi(offset, offset, -16); stvx(VR26, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4558
  offsetInt -= 16; addi(offset, offset, -16); stvx(VR27, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4559
  offsetInt -= 16; addi(offset, offset, -16); stvx(VR28, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4560
  offsetInt -= 8; std(R22, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4561
  offsetInt -= 8; std(R23, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4562
  offsetInt -= 8; std(R24, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4563
  offsetInt -= 8; std(R25, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4564
  offsetInt -= 8; std(R26, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4565
  offsetInt -= 8; std(R27, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4566
  offsetInt -= 8; std(R28, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4567
  offsetInt -= 8; std(R29, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4568
  offsetInt -= 8; std(R30, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4569
  offsetInt -= 8; std(R31, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4570
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4571
  // Set constants
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4572
  li(off16, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4573
  li(off32, 32);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4574
  li(off48, 48);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4575
  li(off64, 64);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4576
  li(off80, 80);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4577
  li(off96, 96);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4578
  li(off112, 112);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4579
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4580
  clrldi(crc, crc, 32);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4581
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4582
  vxor(zeroes, zeroes, zeroes);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4583
  vspltisw(VR0, -1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4584
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4585
  vsldoi(mask_32bit, zeroes, VR0, 4);
46789
1bf8c1e8b79a 8185975: PPC64: Fix vsldoi interface according to the ISA
mdoerr
parents: 46494
diff changeset
  4586
  vsldoi(mask_64bit, zeroes, VR0, 8);
41334
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4587
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4588
  // Get the initial value into v8
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4589
  vxor(VR8, VR8, VR8);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4590
  mtvrd(VR8, crc);
46789
1bf8c1e8b79a 8185975: PPC64: Fix vsldoi interface according to the ISA
mdoerr
parents: 46494
diff changeset
  4591
  vsldoi(VR8, zeroes, VR8, 8); // shift into bottom 32 bits
41334
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4592
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4593
  li (rLoaded, 0);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4594
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4595
  rldicr(rIdx, len, 0, 56);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4596
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4597
  {
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4598
    BIND(L_1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4599
    // Checksum in blocks of MAX_SIZE (32768)
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4600
    lis(rMax, 0);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4601
    ori(rMax, rMax, 32768);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4602
    mr(rTmp2, rMax);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4603
    cmpd(CCR0, rIdx, rMax);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4604
    bgt(CCR0, L_2);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4605
    mr(rMax, rIdx);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4606
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4607
    BIND(L_2);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4608
    subf(rIdx, rMax, rIdx);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4609
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4610
    // our main loop does 128 bytes at a time
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4611
    srdi(rMax, rMax, 7);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4612
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4613
    /*
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4614
     * Work out the offset into the constants table to start at. Each
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4615
     * constant is 16 bytes, and it is used against 128 bytes of input
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4616
     * data - 128 / 16 = 8
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4617
     */
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4618
    sldi(rTmp1, rMax, 4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4619
    srdi(rTmp2, rTmp2, 3);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4620
    subf(rTmp1, rTmp1, rTmp2);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4621
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4622
    // We reduce our final 128 bytes in a separate step
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4623
    addi(rMax, rMax, -1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4624
    mtctr(rMax);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4625
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4626
    // Find the start of our constants
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4627
    add(constantsPos, constants, rTmp1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4628
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4629
    // zero VR0-v7 which will contain our checksums
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4630
    vxor(VR0, VR0, VR0);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4631
    vxor(VR1, VR1, VR1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4632
    vxor(VR2, VR2, VR2);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4633
    vxor(VR3, VR3, VR3);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4634
    vxor(VR4, VR4, VR4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4635
    vxor(VR5, VR5, VR5);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4636
    vxor(VR6, VR6, VR6);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4637
    vxor(VR7, VR7, VR7);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4638
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4639
    lvx(const1, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4640
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4641
    /*
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4642
     * If we are looping back to consume more data we use the values
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4643
     * already in VR16-v23.
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4644
     */
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4645
    cmpdi(CCR0, rLoaded, 1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4646
    beq(CCR0, L_3);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4647
    {
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4648
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4649
      // First warm up pass
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4650
      lvx(VR16, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4651
      lvx(VR17, off16, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4652
      lvx(VR18, off32, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4653
      lvx(VR19, off48, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4654
      lvx(VR20, off64, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4655
      lvx(VR21, off80, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4656
      lvx(VR22, off96, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4657
      lvx(VR23, off112, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4658
      addi(buf, buf, 8*16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4659
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4660
      // xor in initial value
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4661
      vxor(VR16, VR16, VR8);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4662
    }
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4663
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4664
    BIND(L_3);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4665
    bdz(L_first_warm_up_done);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4666
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4667
    addi(constantsPos, constantsPos, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4668
    lvx(const2, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4669
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4670
    // Second warm up pass
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4671
    vpmsumd(VR8, VR16, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4672
    lvx(VR16, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4673
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4674
    vpmsumd(VR9, VR17, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4675
    lvx(VR17, off16, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4676
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4677
    vpmsumd(VR10, VR18, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4678
    lvx(VR18, off32, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4679
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4680
    vpmsumd(VR11, VR19, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4681
    lvx(VR19, off48, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4682
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4683
    vpmsumd(VR12, VR20, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4684
    lvx(VR20, off64, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4685
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4686
    vpmsumd(VR13, VR21, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4687
    lvx(VR21, off80, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4688
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4689
    vpmsumd(VR14, VR22, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4690
    lvx(VR22, off96, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4691
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4692
    vpmsumd(VR15, VR23, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4693
    lvx(VR23, off112, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4694
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4695
    addi(buf, buf, 8 * 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4696
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4697
    bdz(L_first_cool_down);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4698
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4699
    /*
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4700
     * main loop. We modulo schedule it such that it takes three iterations
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4701
     * to complete - first iteration load, second iteration vpmsum, third
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4702
     * iteration xor.
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4703
     */
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4704
    {
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4705
      BIND(L_4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4706
      lvx(const1, constantsPos); addi(constantsPos, constantsPos, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4707
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4708
      vxor(VR0, VR0, VR8);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4709
      vpmsumd(VR8, VR16, const2);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4710
      lvx(VR16, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4711
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4712
      vxor(VR1, VR1, VR9);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4713
      vpmsumd(VR9, VR17, const2);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4714
      lvx(VR17, off16, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4715
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4716
      vxor(VR2, VR2, VR10);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4717
      vpmsumd(VR10, VR18, const2);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4718
      lvx(VR18, off32, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4719
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4720
      vxor(VR3, VR3, VR11);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4721
      vpmsumd(VR11, VR19, const2);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4722
      lvx(VR19, off48, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4723
      lvx(const2, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4724
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4725
      vxor(VR4, VR4, VR12);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4726
      vpmsumd(VR12, VR20, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4727
      lvx(VR20, off64, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4728
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4729
      vxor(VR5, VR5, VR13);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4730
      vpmsumd(VR13, VR21, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4731
      lvx(VR21, off80, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4732
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4733
      vxor(VR6, VR6, VR14);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4734
      vpmsumd(VR14, VR22, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4735
      lvx(VR22, off96, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4736
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4737
      vxor(VR7, VR7, VR15);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4738
      vpmsumd(VR15, VR23, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4739
      lvx(VR23, off112, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4740
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4741
      addi(buf, buf, 8 * 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4742
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4743
      bdnz(L_4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4744
    }
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4745
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4746
    BIND(L_first_cool_down);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4747
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4748
    // First cool down pass
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4749
    lvx(const1, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4750
    addi(constantsPos, constantsPos, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4751
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4752
    vxor(VR0, VR0, VR8);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4753
    vpmsumd(VR8, VR16, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4754
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4755
    vxor(VR1, VR1, VR9);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4756
    vpmsumd(VR9, VR17, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4757
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4758
    vxor(VR2, VR2, VR10);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4759
    vpmsumd(VR10, VR18, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4760
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4761
    vxor(VR3, VR3, VR11);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4762
    vpmsumd(VR11, VR19, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4763
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4764
    vxor(VR4, VR4, VR12);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4765
    vpmsumd(VR12, VR20, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4766
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4767
    vxor(VR5, VR5, VR13);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4768
    vpmsumd(VR13, VR21, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4769
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4770
    vxor(VR6, VR6, VR14);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4771
    vpmsumd(VR14, VR22, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4772
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4773
    vxor(VR7, VR7, VR15);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4774
    vpmsumd(VR15, VR23, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4775
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4776
    BIND(L_second_cool_down);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4777
    // Second cool down pass
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4778
    vxor(VR0, VR0, VR8);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4779
    vxor(VR1, VR1, VR9);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4780
    vxor(VR2, VR2, VR10);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4781
    vxor(VR3, VR3, VR11);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4782
    vxor(VR4, VR4, VR12);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4783
    vxor(VR5, VR5, VR13);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4784
    vxor(VR6, VR6, VR14);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4785
    vxor(VR7, VR7, VR15);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4786
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4787
    /*
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4788
     * vpmsumd produces a 96 bit result in the least significant bits
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4789
     * of the register. Since we are bit reflected we have to shift it
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4790
     * left 32 bits so it occupies the least significant bits in the
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4791
     * bit reflected domain.
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4792
     */
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4793
    vsldoi(VR0, VR0, zeroes, 4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4794
    vsldoi(VR1, VR1, zeroes, 4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4795
    vsldoi(VR2, VR2, zeroes, 4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4796
    vsldoi(VR3, VR3, zeroes, 4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4797
    vsldoi(VR4, VR4, zeroes, 4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4798
    vsldoi(VR5, VR5, zeroes, 4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4799
    vsldoi(VR6, VR6, zeroes, 4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4800
    vsldoi(VR7, VR7, zeroes, 4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4801
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4802
    // xor with last 1024 bits
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4803
    lvx(VR8, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4804
    lvx(VR9, off16, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4805
    lvx(VR10, off32, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4806
    lvx(VR11, off48, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4807
    lvx(VR12, off64, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4808
    lvx(VR13, off80, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4809
    lvx(VR14, off96, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4810
    lvx(VR15, off112, buf);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4811
    addi(buf, buf, 8 * 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4812
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4813
    vxor(VR16, VR0, VR8);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4814
    vxor(VR17, VR1, VR9);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4815
    vxor(VR18, VR2, VR10);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4816
    vxor(VR19, VR3, VR11);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4817
    vxor(VR20, VR4, VR12);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4818
    vxor(VR21, VR5, VR13);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4819
    vxor(VR22, VR6, VR14);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4820
    vxor(VR23, VR7, VR15);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4821
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4822
    li(rLoaded, 1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4823
    cmpdi(CCR0, rIdx, 0);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4824
    addi(rIdx, rIdx, 128);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4825
    bne(CCR0, L_1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4826
  }
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4827
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4828
  // Work out how many bytes we have left
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4829
  andi_(len, len, 127);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4830
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4831
  // Calculate where in the constant table we need to start
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4832
  subfic(rTmp1, len, 128);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4833
  add(constantsPos, constantsPos, rTmp1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4834
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4835
  // How many 16 byte chunks are in the tail
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4836
  srdi(rIdx, len, 4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4837
  mtctr(rIdx);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4838
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4839
  /*
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4840
   * Reduce the previously calculated 1024 bits to 64 bits, shifting
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4841
   * 32 bits to include the trailing 32 bits of zeros
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4842
   */
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4843
  lvx(VR0, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4844
  lvx(VR1, off16, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4845
  lvx(VR2, off32, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4846
  lvx(VR3, off48, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4847
  lvx(VR4, off64, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4848
  lvx(VR5, off80, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4849
  lvx(VR6, off96, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4850
  lvx(VR7, off112, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4851
  addi(constantsPos, constantsPos, 8 * 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4852
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4853
  vpmsumw(VR0, VR16, VR0);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4854
  vpmsumw(VR1, VR17, VR1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4855
  vpmsumw(VR2, VR18, VR2);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4856
  vpmsumw(VR3, VR19, VR3);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4857
  vpmsumw(VR4, VR20, VR4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4858
  vpmsumw(VR5, VR21, VR5);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4859
  vpmsumw(VR6, VR22, VR6);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4860
  vpmsumw(VR7, VR23, VR7);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4861
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4862
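  // Now reduce the tail (0 - 112 bytes)
  // NOTE(review): CCR0 is written only by the cmpdi below; the lvx/addi/
  // vpmsumw/vxor steps that follow do not update it, so once the first
  // beq(CCR0, L_XOR) falls through, the later beq(CCR0, L_XOR) checks can
  // never be taken. CTR was loaded from rIdx (mtctr above) but is never
  // decremented here. Presumably bdz(L_XOR) was intended after each 16-byte
  // step - TODO confirm before calling this with a non-zero tail.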
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4863
  cmpdi(CCR0, rIdx, 0);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4864
  beq(CCR0, L_XOR);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4865
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4866
  lvx(VR16, buf); addi(buf, buf, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4867
  lvx(VR17, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4868
  vpmsumw(VR16, VR16, VR17);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4869
  vxor(VR0, VR0, VR16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4870
  beq(CCR0, L_XOR);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4871
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4872
  lvx(VR16, buf); addi(buf, buf, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4873
  lvx(VR17, off16, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4874
  vpmsumw(VR16, VR16, VR17);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4875
  vxor(VR0, VR0, VR16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4876
  beq(CCR0, L_XOR);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4877
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4878
  lvx(VR16, buf); addi(buf, buf, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4879
  lvx(VR17, off32, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4880
  vpmsumw(VR16, VR16, VR17);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4881
  vxor(VR0, VR0, VR16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4882
  beq(CCR0, L_XOR);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4883
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4884
  lvx(VR16, buf); addi(buf, buf, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4885
  lvx(VR17, off48,constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4886
  vpmsumw(VR16, VR16, VR17);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4887
  vxor(VR0, VR0, VR16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4888
  beq(CCR0, L_XOR);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4889
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4890
  lvx(VR16, buf); addi(buf, buf, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4891
  lvx(VR17, off64, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4892
  vpmsumw(VR16, VR16, VR17);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4893
  vxor(VR0, VR0, VR16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4894
  beq(CCR0, L_XOR);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4895
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4896
  lvx(VR16, buf); addi(buf, buf, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4897
  lvx(VR17, off80, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4898
  vpmsumw(VR16, VR16, VR17);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4899
  vxor(VR0, VR0, VR16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4900
  beq(CCR0, L_XOR);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4901
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4902
  lvx(VR16, buf); addi(buf, buf, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4903
  lvx(VR17, off96, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4904
  vpmsumw(VR16, VR16, VR17);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4905
  vxor(VR0, VR0, VR16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4906
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4907
  // Now xor all the parallel chunks together
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4908
  BIND(L_XOR);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4909
  vxor(VR0, VR0, VR1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4910
  vxor(VR2, VR2, VR3);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4911
  vxor(VR4, VR4, VR5);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4912
  vxor(VR6, VR6, VR7);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4913
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4914
  vxor(VR0, VR0, VR2);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4915
  vxor(VR4, VR4, VR6);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4916
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4917
  vxor(VR0, VR0, VR4);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4918
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4919
  b(L_barrett_reduction);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4920
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4921
  BIND(L_first_warm_up_done);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4922
  lvx(const1, constantsPos);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4923
  addi(constantsPos, constantsPos, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4924
  vpmsumd(VR8,  VR16, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4925
  vpmsumd(VR9,  VR17, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4926
  vpmsumd(VR10, VR18, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4927
  vpmsumd(VR11, VR19, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4928
  vpmsumd(VR12, VR20, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4929
  vpmsumd(VR13, VR21, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4930
  vpmsumd(VR14, VR22, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4931
  vpmsumd(VR15, VR23, const1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4932
  b(L_second_cool_down);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4933
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4934
  BIND(L_barrett_reduction);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4935
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4936
  lvx(const1, barretConstants);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4937
  addi(barretConstants, barretConstants, 16);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4938
  lvx(const2, barretConstants);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4939
46789
1bf8c1e8b79a 8185975: PPC64: Fix vsldoi interface according to the ISA
mdoerr
parents: 46494
diff changeset
  4940
  vsldoi(VR1, VR0, VR0, 8);
41334
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4941
  vxor(VR0, VR0, VR1);    // xor two 64 bit results together
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4942
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4943
  // shift left one bit
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4944
  vspltisb(VR1, 1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4945
  vsl(VR0, VR0, VR1);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4946
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4947
  vand(VR0, VR0, mask_64bit);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4948
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4949
  /*
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4950
   * The reflected version of Barrett reduction. Instead of bit
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4951
   * reflecting our data (which is expensive to do), we bit reflect our
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4952
   * constants and our algorithm, which means the intermediate data in
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4953
   * our vector registers goes from 0-63 instead of 63-0. We can reflect
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4954
   * the algorithm because we don't carry in mod 2 arithmetic.
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4955
   */
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4956
  vand(VR1, VR0, mask_32bit);  // bottom 32 bits of a
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4957
  vpmsumd(VR1, VR1, const1);   // ma
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4958
  vand(VR1, VR1, mask_32bit);  // bottom 32bits of ma
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4959
  vpmsumd(VR1, VR1, const2);   // qn */
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4960
  vxor(VR0, VR0, VR1);         // a - qn, subtraction is xor in GF(2)
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4961
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4962
  /*
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4963
   * Since we are bit reflected, the result (ie the low 32 bits) is in
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4964
   * the high 32 bits. We just need to shift it left 4 bytes
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4965
   * V0 [ 0 1 X 3 ]
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4966
   * V0 [ 0 X 2 3 ]
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4967
   */
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4968
  vsldoi(VR0, VR0, zeroes, 4);    // shift result into top 64 bits of
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4969
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4970
  // Get it into r3
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4971
  mfvrd(crc, VR0);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4972
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4973
  BIND(L_end);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4974
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4975
  offsetInt = 0;
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4976
  // Restore non-volatile Vector registers (frameless).
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4977
  offsetInt -= 16; li(offset, -16);           lvx(VR20, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4978
  offsetInt -= 16; addi(offset, offset, -16); lvx(VR21, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4979
  offsetInt -= 16; addi(offset, offset, -16); lvx(VR22, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4980
  offsetInt -= 16; addi(offset, offset, -16); lvx(VR23, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4981
  offsetInt -= 16; addi(offset, offset, -16); lvx(VR24, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4982
  offsetInt -= 16; addi(offset, offset, -16); lvx(VR25, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4983
  offsetInt -= 16; addi(offset, offset, -16); lvx(VR26, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4984
  offsetInt -= 16; addi(offset, offset, -16); lvx(VR27, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4985
  offsetInt -= 16; addi(offset, offset, -16); lvx(VR28, offset, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4986
  offsetInt -= 8;  ld(R22, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4987
  offsetInt -= 8;  ld(R23, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4988
  offsetInt -= 8;  ld(R24, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4989
  offsetInt -= 8;  ld(R25, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4990
  offsetInt -= 8;  ld(R26, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4991
  offsetInt -= 8;  ld(R27, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4992
  offsetInt -= 8;  ld(R28, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4993
  offsetInt -= 8;  ld(R29, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4994
  offsetInt -= 8;  ld(R30, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4995
  offsetInt -= 8;  ld(R31, offsetInt, R1_SP);
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4996
}
8b28be7b8613 8164920: ppc: enhancement of CRC32 intrinsic
mdoerr
parents: 39444
diff changeset
  4997
46317
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  4998
// Emit code that folds the single byte found at buf[0] into crc.
//
//   crc       - running CRC value, updated in place
//   buf       - address of the byte to process
//   len       - not used by this kernel (hence excluded from the register check)
//   table     - table register handed on to update_byte_crc32
//   tmp       - scratch register that receives the loaded byte
//   invertCRC - if true, crc is complemented before and after the update
void MacroAssembler::kernel_crc32_singleByte(Register crc, Register buf, Register len,
                                             Register table, Register tmp, bool invertCRC) {
  assert_different_registers(crc, buf, /* len is unused */ table, tmp);

  BLOCK_COMMENT("kernel_crc32_singleByte:");

  // Optional pre-inversion: nand of a value with itself is its 1s complement.
  if (invertCRC) { nand(crc, crc, crc); }

  // Fetch the byte (zero-extended) and fold it into the CRC.
  lbz(tmp, 0, buf);
  update_byte_crc32(crc, tmp, table);

  // Optional post-inversion, mirroring the one above.
  if (invertCRC) { nand(crc, crc, crc); }
}
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  5013
5f88747fe29e 8175369: [ppc] Provide intrinsic implementation for CRC32C
lucy
parents: 43428
diff changeset
  5014
// Emit code that folds a byte already held in a register into crc.
//
//   crc       - running CRC value, updated in place
//   val       - register holding the byte to process
//   table     - table register handed on to update_byte_crc32
//   invertCRC - if true, crc is complemented before and after the update
void MacroAssembler::kernel_crc32_singleByteReg(Register crc, Register val,
                                                Register table, bool invertCRC) {
  assert_different_registers(crc, val, table);

  BLOCK_COMMENT("kernel_crc32_singleByteReg:");

  // Optional pre-inversion: nand of a value with itself is its 1s complement.
  if (invertCRC) { nand(crc, crc, crc); }

  update_byte_crc32(crc, val, table);

  // Optional post-inversion, mirroring the one above.
  if (invertCRC) { nand(crc, crc, crc); }
}
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  5028
31773
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5029
// dest_lo += src1 + src2
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5030
// dest_hi += carry1 + carry2
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5031
void MacroAssembler::add2_with_carry(Register dest_hi,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5032
                                     Register dest_lo,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5033
                                     Register src1, Register src2) {
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5034
  li(R0, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5035
  addc(dest_lo, dest_lo, src1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5036
  adde(dest_hi, dest_hi, R0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5037
  addc(dest_lo, dest_lo, src2);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5038
  adde(dest_hi, dest_hi, R0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5039
}
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5040
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5041
// Multiply 64 bit by 64 bit first loop.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5042
void MacroAssembler::multiply_64_x_64_loop(Register x, Register xstart,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5043
                                           Register x_xstart,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5044
                                           Register y, Register y_idx,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5045
                                           Register z,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5046
                                           Register carry,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5047
                                           Register product_high, Register product,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5048
                                           Register idx, Register kdx,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5049
                                           Register tmp) {
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5050
  //  jlong carry, x[], y[], z[];
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5051
  //  for (int idx=ystart, kdx=ystart+1+xstart; idx >= 0; idx--, kdx--) {
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5052
  //    huge_128 product = y[idx] * x[xstart] + carry;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5053
  //    z[kdx] = (jlong)product;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5054
  //    carry  = (jlong)(product >>> 64);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5055
  //  }
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5056
  //  z[xstart] = carry;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5057
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5058
  Label L_first_loop, L_first_loop_exit;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5059
  Label L_one_x, L_one_y, L_multiply;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5060
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5061
  addic_(xstart, xstart, -1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5062
  blt(CCR0, L_one_x);   // Special case: length of x is 1.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5063
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5064
  // Load next two integers of x.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5065
  sldi(tmp, xstart, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5066
  ldx(x_xstart, x, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5067
#ifdef VM_LITTLE_ENDIAN
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5068
  rldicl(x_xstart, x_xstart, 32, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5069
#endif
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5070
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5071
  align(32, 16);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5072
  bind(L_first_loop);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5073
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5074
  cmpdi(CCR0, idx, 1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5075
  blt(CCR0, L_first_loop_exit);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5076
  addi(idx, idx, -2);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5077
  beq(CCR0, L_one_y);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5078
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5079
  // Load next two integers of y.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5080
  sldi(tmp, idx, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5081
  ldx(y_idx, y, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5082
#ifdef VM_LITTLE_ENDIAN
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5083
  rldicl(y_idx, y_idx, 32, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5084
#endif
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5085
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5086
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5087
  bind(L_multiply);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5088
  multiply64(product_high, product, x_xstart, y_idx);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5089
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5090
  li(tmp, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5091
  addc(product, product, carry);         // Add carry to result.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5092
  adde(product_high, product_high, tmp); // Add carry of the last addition.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5093
  addi(kdx, kdx, -2);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5094
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5095
  // Store result.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5096
#ifdef VM_LITTLE_ENDIAN
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5097
  rldicl(product, product, 32, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5098
#endif
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5099
  sldi(tmp, kdx, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5100
  stdx(product, z, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5101
  mr_if_needed(carry, product_high);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5102
  b(L_first_loop);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5103
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5104
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5105
  bind(L_one_y); // Load one 32 bit portion of y as (0,value).
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5106
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5107
  lwz(y_idx, 0, y);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5108
  b(L_multiply);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5109
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5110
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  5111
  bind(L_one_x); // Load one 32 bit portion of x as (0,value).
31773
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5112
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5113
  lwz(x_xstart, 0, x);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5114
  b(L_first_loop);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5115
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5116
  bind(L_first_loop_exit);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5117
}
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5118
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5119
// Multiply 64 bit by 64 bit and add 128 bit.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5120
void MacroAssembler::multiply_add_128_x_128(Register x_xstart, Register y,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5121
                                            Register z, Register yz_idx,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5122
                                            Register idx, Register carry,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5123
                                            Register product_high, Register product,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5124
                                            Register tmp, int offset) {
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5125
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5126
  //  huge_128 product = (y[idx] * x_xstart) + z[kdx] + carry;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5127
  //  z[kdx] = (jlong)product;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5128
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5129
  sldi(tmp, idx, LogBytesPerInt);
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  5130
  if (offset) {
31773
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5131
    addi(tmp, tmp, offset);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5132
  }
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5133
  ldx(yz_idx, y, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5134
#ifdef VM_LITTLE_ENDIAN
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5135
  rldicl(yz_idx, yz_idx, 32, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5136
#endif
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5137
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5138
  multiply64(product_high, product, x_xstart, yz_idx);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5139
  ldx(yz_idx, z, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5140
#ifdef VM_LITTLE_ENDIAN
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5141
  rldicl(yz_idx, yz_idx, 32, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5142
#endif
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5143
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5144
  add2_with_carry(product_high, product, carry, yz_idx);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5145
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5146
  sldi(tmp, idx, LogBytesPerInt);
31861
7efea6fae96b 8131048: ppc: implement CRC32 intrinsic
goetz
parents: 31773
diff changeset
  5147
  if (offset) {
31773
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5148
    addi(tmp, tmp, offset);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5149
  }
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5150
#ifdef VM_LITTLE_ENDIAN
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5151
  rldicl(product, product, 32, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5152
#endif
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5153
  stdx(product, z, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5154
}
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5155
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5156
// Multiply 128 bit by 128 bit. Unrolled inner loop.
//
// Emits the inner ("third") loop sketched in the pseudo code at the top of the
// body. Each pass of the CTR-counted loop steps idx down by four and performs
// two multiply_add_128_x_128 steps (byte offsets 8 and 0), chaining the carry
// through carry2. A remainder of two and/or one is handled after the loop.
//
// Registers written by the code emitted here: idx, carry, carry2, yz_idx,
// product, product_high, tmp, R0 (used as jdx), CCR0 and CTR.
// NOTE(review): what multiply_add_128_x_128 / multiply64 / add2_with_carry
// clobber in addition is not visible from this function - check the helpers.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5157
void MacroAssembler::multiply_128_x_128_loop(Register x_xstart,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5158
                                             Register y, Register z,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5159
                                             Register yz_idx, Register idx, Register carry,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5160
                                             Register product_high, Register product,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5161
                                             Register carry2, Register tmp) {
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5162
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5163
  // Pseudo code of the emitted loop.
  // NOTE(review): the pseudo code steps idx by 2 over jlong elements, while the
  // emitted code steps idx by 4 and scales it with LogBytesPerInt, i.e. idx
  // appears to count 32-bit ints here - confirm against the caller.
  //  jlong carry, x[], y[], z[];
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5164
  //  int kdx = ystart+1;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5165
  //  for (int idx=ystart-2; idx >= 0; idx -= 2) { // Third loop
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5166
  //    huge_128 product = (y[idx+1] * x_xstart) + z[kdx+idx+1] + carry;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5167
  //    z[kdx+idx+1] = (jlong)product;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5168
  //    jlong carry2 = (jlong)(product >>> 64);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5169
  //    product = (y[idx] * x_xstart) + z[kdx+idx] + carry2;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5170
  //    z[kdx+idx] = (jlong)product;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5171
  //    carry = (jlong)(product >>> 64);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5172
  //  }
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5173
  //  idx += 2;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5174
  //  if (idx > 0) {
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5175
  //    product = (y[idx] * x_xstart) + z[kdx+idx] + carry;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5176
  //    z[kdx+idx] = (jlong)product;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5177
  //    carry = (jlong)(product >>> 64);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5178
  //  }
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5179
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5180
  Label L_third_loop, L_third_loop_exit, L_post_third_loop_done;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5181
  // R0 serves as scratch for the iteration count that is moved into CTR.
  const Register jdx = R0;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5182
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5183
  // Scale the index.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5184
  // jdx = idx >> 2 (number of unrolled passes); the record form sets CCR0 so
  // that a count of zero skips the loop entirely.
  srdi_(jdx, idx, 2);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5185
  beq(CCR0, L_third_loop_exit);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5186
  mtctr(jdx);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5187
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5188
  // Align the loop entry (see align() for the meaning of the two arguments).
  align(32, 16);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5189
  bind(L_third_loop);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5190
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5191
  // Step down by four; both steps below address relative to the new idx.
  addi(idx, idx, -4);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5192
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5193
  // First step: byte offset 8, carry-in is 'carry'; its high part becomes carry2.
  multiply_add_128_x_128(x_xstart, y, z, yz_idx, idx, carry, product_high, product, tmp, 8);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5194
  mr_if_needed(carry2, product_high);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5195
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5196
  // Second step: byte offset 0, carry-in is carry2; its high part is the new 'carry'.
  multiply_add_128_x_128(x_xstart, y, z, yz_idx, idx, carry2, product_high, product, tmp, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5197
  mr_if_needed(carry, product_high);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5198
  // Decrement CTR and repeat while it is non-zero.
  bdnz(L_third_loop);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5199
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5200
  bind(L_third_loop_exit);  // Handle any left-over operand parts.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5201
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5202
  // idx &= 3: remainder not covered by the unrolled loop; nothing left if zero.
  andi_(idx, idx, 0x3);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5203
  beq(CCR0, L_post_third_loop_done);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5204
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5205
  Label L_check_1;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5206
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5207
  // idx -= 2; negative means the remainder was 1, so skip the two-wide step.
  addic_(idx, idx, -2);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5208
  blt(CCR0, L_check_1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5209
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5210
  // Remainder was 2 or 3: one more step at the (already decremented) idx.
  multiply_add_128_x_128(x_xstart, y, z, yz_idx, idx, carry, product_high, product, tmp, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5211
  mr_if_needed(carry, product_high);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5212
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5213
  bind(L_check_1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5214
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5215
  // Undo the -2, keep only the lowest bit and subtract 1: idx ends up 0 when a
  // single element is left, or -1 (branch to done) when the remainder was even.
  addi(idx, idx, 0x2);
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5216
  andi_(idx, idx, 0x1);
31773
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5217
  addic_(idx, idx, -1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5218
  blt(CCR0, L_post_third_loop_done);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5219
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5220
  // Last single 32-bit element: load the y word, multiply it by x_xstart, then
  // load the z word at the same byte offset into yz_idx.
  sldi(tmp, idx, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5221
  lwzx(yz_idx, y, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5222
  multiply64(product_high, product, x_xstart, yz_idx);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5223
  lwzx(yz_idx, z, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5224
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5225
  // Fold the z word and the incoming carry into product_high:product.
  add2_with_carry(product_high, product, yz_idx, carry);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5226
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5227
  // Store only the low 32 bits of the result back to z.
  sldi(tmp, idx, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5228
  stwx(product, z, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5229
  srdi(product, product, 32);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5230
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5231
  // carry = (product >> 32) | (product_high << 32): the result shifted right by
  // the 32 bits that were just stored.
  sldi(product_high, product_high, 32);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5232
  orr(product, product, product_high);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5233
  mr_if_needed(carry, product);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5234
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5235
  bind(L_post_third_loop_done);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5236
}   // multiply_128_x_128_loop
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5237
47521
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5238
// Emits a multiply-accumulate loop over 32-bit words.
//
// For each of 'len' iterations the generated code loads one word from 'in'
// (starting at byte offset (len-1)*4 and walking down), multiplies it by 'k',
// adds the word of 'out' at byte offset 'offset' - 4 (also walking down) plus
// the running carry, stores the low 32 bits back to 'out' and keeps the
// result shifted right by 32 as the next carry.
//
//   out, in      base addresses, only read as address operands
//   offset       byte offset into 'out'; modified
//   len          element count; modified (turned into a byte offset into 'in')
//   k            multiplier
//   tmp1, tmp2   scratch
//   carry        zeroed on entry; holds the final carry when the loop is done
//
// Also writes CCR0 and, when len > 0, CTR. 'offset' is decremented and 'carry'
// cleared even when len <= 0, because both happen before the branch to SKIP.
// NOTE(review): assumes k is a zero-extended 32-bit value so that the 64-bit
// sum below cannot overflow - confirm at the caller.
void MacroAssembler::muladd(Register out, Register in,
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5239
                            Register offset, Register len, Register k,
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5240
                            Register tmp1, Register tmp2, Register carry) {
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5241
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5242
  // Labels
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5243
  Label LOOP, SKIP;
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5244
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5245
  // Make sure length is positive.
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5246
  // The result in CCR0 is consumed by the ble below; the two instructions in
  // between are not record forms.
  cmpdi  (CCR0,    len,     0);
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5247
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5248
  // Prepare variables
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5249
  // Point 'offset' at the first word of 'out' to update and start with carry 0.
  subi   (offset,  offset,  4);
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5250
  li     (carry,   0);
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5251
  ble    (CCR0,    SKIP);
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5252
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5253
  // CTR = iteration count; then turn len into the byte offset of the last
  // word of 'in': (len - 1) * 4.
  mtctr  (len);
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5254
  subi   (len,     len,     1    );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5255
  sldi   (len,     len,     2    );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5256
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5257
  // Main loop
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5258
  bind(LOOP);
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5259
  // Load the current words of 'in' and 'out' (lwzx zero-extends to 64 bit).
  lwzx   (tmp1,    len,     in   );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5260
  lwzx   (tmp2,    offset,  out  );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5261
  // tmp2 = in_word * k + out_word + carry, computed as a 64-bit value.
  mulld  (tmp1,    tmp1,    k    );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5262
  add    (tmp2,    carry,   tmp2 );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5263
  add    (tmp2,    tmp1,    tmp2 );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5264
  // Low 32 bits go back to 'out'; the upper 32 bits are the next carry.
  stwx   (tmp2,    offset,  out  );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5265
  srdi   (carry,   tmp2,    32   );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5266
  // Step both byte offsets down by one word.
  subi   (offset,  offset,  4    );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5267
  subi   (len,     len,     4    );
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5268
  // Decrement CTR and repeat while it is non-zero.
  bdnz   (LOOP);
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5269
  bind(SKIP);
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5270
}
122833427b36 8185976: PPC64: Implement MulAdd and SquareToLen intrinsics
goetz
parents: 47520
diff changeset
  5271
31773
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5272
void MacroAssembler::multiply_to_len(Register x, Register xlen,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5273
                                     Register y, Register ylen,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5274
                                     Register z, Register zlen,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5275
                                     Register tmp1, Register tmp2,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5276
                                     Register tmp3, Register tmp4,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5277
                                     Register tmp5, Register tmp6,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5278
                                     Register tmp7, Register tmp8,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5279
                                     Register tmp9, Register tmp10,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5280
                                     Register tmp11, Register tmp12,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5281
                                     Register tmp13) {
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5282
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5283
  ShortBranchVerifier sbv(this);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5284
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5285
  assert_different_registers(x, xlen, y, ylen, z, zlen,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5286
                             tmp1, tmp2, tmp3, tmp4, tmp5, tmp6);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5287
  assert_different_registers(x, xlen, y, ylen, z, zlen,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5288
                             tmp1, tmp2, tmp3, tmp4, tmp5, tmp7);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5289
  assert_different_registers(x, xlen, y, ylen, z, zlen,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5290
                             tmp1, tmp2, tmp3, tmp4, tmp5, tmp8);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5291
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5292
  const Register idx = tmp1;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5293
  const Register kdx = tmp2;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5294
  const Register xstart = tmp3;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5295
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5296
  const Register y_idx = tmp4;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5297
  const Register carry = tmp5;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5298
  const Register product = tmp6;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5299
  const Register product_high = tmp7;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5300
  const Register x_xstart = tmp8;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5301
  const Register tmp = tmp9;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5302
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5303
  // First Loop.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5304
  //
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5305
  //  final static long LONG_MASK = 0xffffffffL;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5306
  //  int xstart = xlen - 1;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5307
  //  int ystart = ylen - 1;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5308
  //  long carry = 0;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5309
  //  for (int idx=ystart, kdx=ystart+1+xstart; idx >= 0; idx--, kdx--) {
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5310
  //    long product = (y[idx] & LONG_MASK) * (x[xstart] & LONG_MASK) + carry;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5311
  //    z[kdx] = (int)product;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5312
  //    carry = product >>> 32;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5313
  //  }
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5314
  //  z[xstart] = (int)carry;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5315
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5316
  mr_if_needed(idx, ylen);        // idx = ylen
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5317
  mr_if_needed(kdx, zlen);        // kdx = xlen + ylen
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5318
  li(carry, 0);                   // carry = 0
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5319
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5320
  Label L_done;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5321
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5322
  addic_(xstart, xlen, -1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5323
  blt(CCR0, L_done);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5324
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5325
  multiply_64_x_64_loop(x, xstart, x_xstart, y, y_idx, z,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5326
                        carry, product_high, product, idx, kdx, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5327
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5328
  Label L_second_loop;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5329
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5330
  cmpdi(CCR0, kdx, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5331
  beq(CCR0, L_second_loop);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5332
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5333
  Label L_carry;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5334
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5335
  addic_(kdx, kdx, -1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5336
  beq(CCR0, L_carry);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5337
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5338
  // Store lower 32 bits of carry.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5339
  sldi(tmp, kdx, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5340
  stwx(carry, z, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5341
  srdi(carry, carry, 32);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5342
  addi(kdx, kdx, -1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5343
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5344
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5345
  bind(L_carry);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5346
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5347
  // Store upper 32 bits of carry.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5348
  sldi(tmp, kdx, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5349
  stwx(carry, z, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5350
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5351
  // Second and third (nested) loops.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5352
  //
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5353
  //  for (int i = xstart-1; i >= 0; i--) { // Second loop
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5354
  //    carry = 0;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5355
  //    for (int jdx=ystart, k=ystart+1+i; jdx >= 0; jdx--, k--) { // Third loop
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5356
  //      long product = (y[jdx] & LONG_MASK) * (x[i] & LONG_MASK) +
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5357
  //                     (z[k] & LONG_MASK) + carry;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5358
  //      z[k] = (int)product;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5359
  //      carry = product >>> 32;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5360
  //    }
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5361
  //    z[i] = (int)carry;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5362
  //  }
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5363
  //
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5364
  //  i = xlen, j = tmp1, k = tmp2, carry = tmp5, x[i] = rdx
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5365
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5366
  bind(L_second_loop);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5367
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5368
  li(carry, 0);                   // carry = 0;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5369
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5370
  addic_(xstart, xstart, -1);     // i = xstart-1;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5371
  blt(CCR0, L_done);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5372
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5373
  Register zsave = tmp10;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5374
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5375
  mr(zsave, z);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5376
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5377
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5378
  Label L_last_x;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5379
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5380
  sldi(tmp, xstart, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5381
  add(z, z, tmp);                 // z = z + k - j
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5382
  addi(z, z, 4);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5383
  addic_(xstart, xstart, -1);     // i = xstart-1;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5384
  blt(CCR0, L_last_x);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5385
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5386
  sldi(tmp, xstart, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5387
  ldx(x_xstart, x, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5388
#ifdef VM_LITTLE_ENDIAN
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5389
  rldicl(x_xstart, x_xstart, 32, 0);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5390
#endif
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5391
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5392
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5393
  Label L_third_loop_prologue;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5394
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5395
  bind(L_third_loop_prologue);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5396
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5397
  Register xsave = tmp11;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5398
  Register xlensave = tmp12;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5399
  Register ylensave = tmp13;
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5400
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5401
  mr(xsave, x);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5402
  mr(xlensave, xstart);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5403
  mr(ylensave, ylen);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5404
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5405
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5406
  multiply_128_x_128_loop(x_xstart, y, z, y_idx, ylen,
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5407
                          carry, product_high, product, x, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5408
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5409
  mr(z, zsave);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5410
  mr(x, xsave);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5411
  mr(xlen, xlensave);   // This is the decrement of the loop counter!
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5412
  mr(ylen, ylensave);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5413
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5414
  addi(tmp3, xlen, 1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5415
  sldi(tmp, tmp3, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5416
  stwx(carry, z, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5417
  addic_(tmp3, tmp3, -1);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5418
  blt(CCR0, L_done);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5419
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5420
  srdi(carry, carry, 32);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5421
  sldi(tmp, tmp3, LogBytesPerInt);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5422
  stwx(carry, z, tmp);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5423
  b(L_second_loop);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5424
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5425
  // Next infrequent code is moved outside loops.
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5426
  bind(L_last_x);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5427
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5428
  lwz(x_xstart, 0, x);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5429
  b(L_third_loop_prologue);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5430
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5431
  bind(L_done);
f874931cbae7 8130653: ppc: implement MultiplyToLen intrinsic
goetz
parents: 30764
diff changeset
  5432
}   // multiply_to_len
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5433
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5434
// Debug-build assertion on the condition currently held in CCR0.
//
// Emits nothing unless ASSERT is defined. Otherwise emits a conditional
// branch on CCR0 that skips over a stop(msg, id) sequence:
//   check_equal == true  -> the assertion passes when CCR0 is "equal"     (beq)
//   check_equal == false -> the assertion passes when CCR0 is "not equal" (bne)
// No compare is emitted here; the caller must have set CCR0 beforehand.
void MacroAssembler::asm_assert(bool check_equal, const char *msg, int id) {
#ifdef ASSERT
  Label L_condition_holds;
  if (!check_equal) {
    bne(CCR0, L_condition_holds);
  } else {
    beq(CCR0, L_condition_holds);
  }
  // Only reached in generated code when the expected condition did not hold.
  stop(msg, id);
  bind(L_condition_holds);
#endif // ASSERT
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5446
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5447
void MacroAssembler::asm_assert_mems_zero(bool check_equal, int size, int mem_offset,
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5448
                                          Register mem_base, const char* msg, int id) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5449
#ifdef ASSERT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5450
  switch (size) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5451
    case 4:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5452
      lwz(R0, mem_offset, mem_base);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5453
      cmpwi(CCR0, R0, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5454
      break;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5455
    case 8:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5456
      ld(R0, mem_offset, mem_base);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5457
      cmpdi(CCR0, R0, 0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5458
      break;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5459
    default:
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5460
      ShouldNotReachHere();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5461
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5462
  asm_assert(check_equal, msg, id);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5463
#endif // ASSERT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5464
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5465
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5466
void MacroAssembler::verify_thread() {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5467
  if (VerifyThread) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5468
    unimplemented("'VerifyThread' currently not implemented on PPC");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5469
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5470
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5471
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5472
// READ: oop. KILL: R0. Volatile floats perhaps.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5473
void MacroAssembler::verify_oop(Register oop, const char* msg) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5474
  if (!VerifyOops) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5475
    return;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5476
  }
28187
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  5477
22861
f5c393d456fc 8029940: PPC64 (part 122): C2 compiler port
goetz
parents: 22852
diff changeset
  5478
  address/* FunctionDescriptor** */fd = StubRoutines::verify_oop_subroutine_entry_address();
28187
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  5479
  const Register tmp = R11; // Will be preserved.
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5480
  const int nbytes_save = MacroAssembler::num_volatile_regs * 8;
28187
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  5481
  save_volatile_gprs(R1_SP, -nbytes_save); // except R0
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  5482
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5483
  mr_if_needed(R4_ARG2, oop);
28187
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  5484
  save_LR_CR(tmp); // save in old frame
23211
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  5485
  push_frame_reg_args(nbytes_save, tmp);
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  5486
  // load FunctionDescriptor** / entry_address *
28187
fc19df82d6ee 8066964: ppc64: argument and return type profiling, fix problem with popframe
goetz
parents: 27012
diff changeset
  5487
  load_const_optimized(tmp, fd, R0);
23211
954e3a81da29 8035647: PPC64: Support for elf v2 abi.
goetz
parents: 22867
diff changeset
  5488
  // load FunctionDescriptor* / entry_address
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5489
  ld(tmp, 0, tmp);
35085
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5490
  load_const_optimized(R3_ARG1, (address)msg, R0);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5491
  // Call destination for its side effect.
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5492
  call_c(tmp);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5493
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5494
  pop_frame();
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5495
  restore_LR_CR(tmp);
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5496
  restore_volatile_gprs(R1_SP, -nbytes_save); // except R0
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5497
}
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5498
839c8ba29724 8144019: PPC64 C1: Introduce Client Compiler
mdoerr
parents: 34148
diff changeset
  5499
// Variant of verify_oop for a value that lives in memory.
//
// When VerifyOops is enabled, emits a 64-bit load from offs(base) into
// R4_ARG2 and a call to the verify_oop stub with R3_ARG1 = msg. The load is
// emitted after the volatile GPRs (except R0) have been spilled below SP, so
// overwriting R4_ARG2 is undone by the final restore. LR and CR are saved in
// the caller's frame. Emits nothing when VerifyOops is off.
// KILL: R0.
void MacroAssembler::verify_oop_addr(RegisterOrConstant offs, Register base, const char* msg) {
  if (VerifyOops) {
    address/* FunctionDescriptor** */ stub_entry_slot = StubRoutines::verify_oop_subroutine_entry_address();
    const Register scratch = R11; // Will be preserved.
    const int volatile_save_bytes = MacroAssembler::num_volatile_regs * 8;

    save_volatile_gprs(R1_SP, -volatile_save_bytes); // except R0

    // Fetch the value to verify straight into the second C argument register.
    ld(R4_ARG2, offs, base);
    save_LR_CR(scratch); // save in old frame
    push_frame_reg_args(volatile_save_bytes, scratch);

    // scratch = FunctionDescriptor** / entry_address *
    load_const_optimized(scratch, stub_entry_slot, R0);
    // scratch = FunctionDescriptor* / entry_address
    ld(scratch, 0, scratch);
    load_const_optimized(R3_ARG1, (address)msg, R0);
    // Call destination for its side effect.
    call_c(scratch);

    // Undo the frame and register spills in reverse order.
    pop_frame();
    restore_LR_CR(scratch);
    restore_volatile_gprs(R1_SP, -volatile_save_bytes); // except R0
  }
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5524
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5525
// Printable names of the stop kinds. The table is indexed with the stop type
// reduced modulo its length (see stop_on_request() and MacroAssembler::stop()),
// so the order of the entries must match the numeric stop type values.
const char* stop_types[] = { "stop", "untested", "unimplemented", "shouldnotreachhere" };
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5531
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5532
static void stop_on_request(int tp, const char* msg) {
25374
d7fb2af5d53c 8048169: Change 8037816 breaks HS build on PPC64 and CPP-Interpreter platforms
coleenp
parents: 23492
diff changeset
  5533
  tty->print("PPC assembly code requires stop: (%s) %s\n", stop_types[tp%/*stop_end*/4], msg);
33105
294e48b4f704 8080775: Better argument formatting for assert() and friends
david
parents: 32596
diff changeset
  5534
  guarantee(false, "PPC assembly code requires stop: %s", msg);
22824
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5535
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5536
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5537
// Call a C-function that prints output.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5538
void MacroAssembler::stop(int type, const char* msg, int id) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5539
#ifndef PRODUCT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5540
  block_comment(err_msg("stop: %s %s {", stop_types[type%stop_end], msg));
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5541
#else
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5542
  block_comment("stop {");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5543
#endif
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5544
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5545
  // setup arguments
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5546
  load_const_optimized(R3_ARG1, type);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5547
  load_const_optimized(R4_ARG2, (void *)msg, /*tmp=*/R0);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5548
  call_VM_leaf(CAST_FROM_FN_PTR(address, stop_on_request), R3_ARG1, R4_ARG2);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5549
  illtrap();
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5550
  emit_int32(id);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5551
  block_comment("} stop;");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5552
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5553
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5554
#ifndef PRODUCT
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5555
// Write pattern 0x0101010101010101 in memory region [low-before, high+after].
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5556
// Val, addr are temp registers.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5557
// If low == addr, addr is killed.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5558
// High is preserved.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5559
void MacroAssembler::zap_from_to(Register low, int before, Register high, int after, Register val, Register addr) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5560
  if (!ZapMemory) return;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5561
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5562
  assert_different_registers(low, val);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5563
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5564
  BLOCK_COMMENT("zap memory region {");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5565
  load_const_optimized(val, 0x0101010101010101);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5566
  int size = before + after;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5567
  if (low == high && size < 5 && size > 0) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5568
    int offset = -before*BytesPerWord;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5569
    for (int i = 0; i < size; ++i) {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5570
      std(val, offset, low);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5571
      offset += (1*BytesPerWord);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5572
    }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5573
  } else {
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5574
    addi(addr, low, -before*BytesPerWord);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5575
    assert_different_registers(high, val);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5576
    if (after) addi(high, high, after * BytesPerWord);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5577
    Label loop;
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5578
    bind(loop);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5579
    std(val, 0, addr);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5580
    addi(addr, addr, 8);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5581
    cmpd(CCR6, addr, high);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5582
    ble(CCR6, loop);
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5583
    if (after) addi(high, high, -after * BytesPerWord);  // Correct back to old value.
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5584
  }
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5585
  BLOCK_COMMENT("} zap memory region");
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5586
}
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5587
28258dd5cb2e 8019972: PPC64 (part 9): platform files for interpreter only VM.
goetz
parents:
diff changeset
  5588
#endif // !PRODUCT
23221
b70675ece1ce 8036976: PPC64: implement the template interpreter
goetz
parents: 23211
diff changeset
  5589
b70675ece1ce 8036976: PPC64: implement the template interpreter
goetz
parents: 23211
diff changeset
  5590
// Opens a conditionally skipped code region: emits a load of the byte-sized
// flag at flag_addr into temp, a compare against zero in CCR0 and a branch to
// _label taken when the flag is zero. The destructor binds _label, so the
// code emitted during this object's lifetime is skipped when the flag is zero.
// KILL: temp, R0, CCR0.
SkipIfEqualZero::SkipIfEqualZero(MacroAssembler* masm, Register temp, const bool* flag_addr)
  : _masm(masm), _label() {
  // The flag is read with a single byte load below.
  assert(sizeof(bool) == 1, "PowerPC ABI");

  // load_const_optimized leaves part of the address in temp and returns the
  // displacement to be used by the load that follows.
  const int flag_disp = _masm->load_const_optimized(temp, (address)flag_addr, R0, true);
  _masm->lbz(temp, flag_disp, temp);
  _masm->cmpwi(CCR0, temp, 0);
  _masm->beq(CCR0, _label);
}
b70675ece1ce 8036976: PPC64: implement the template interpreter
goetz
parents: 23211
diff changeset
  5597
b70675ece1ce 8036976: PPC64: implement the template interpreter
goetz
parents: 23211
diff changeset
  5598
// Closes the conditionally skipped region: binds the label targeted by the
// branch emitted in the constructor at the current code position.
SkipIfEqualZero::~SkipIfEqualZero() {
  MacroAssembler* const masm = _masm;
  masm->bind(_label);
}