hotspot/src/cpu/x86/vm/c1_LinearScan_x86.hpp
author vdeshpande
Fri, 08 Jan 2016 21:06:50 -0800
changeset 35540 e001ad24dcdb
parent 30624 2e1803c8a26d
child 41331 ec5e0ea52c77
permissions -rw-r--r--
8143353: update for x86 sin and cos in the math lib Summary: Optimize Math.sin() and cos() for 64 and 32 bit X86 architecture using Intel LIBM implementation. Reviewed-by: kvn
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
     1
/*
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 5547
diff changeset
     2
 * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
489c9b5090e2 Initial load
duke
parents:
diff changeset
     4
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
489c9b5090e2 Initial load
duke
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
489c9b5090e2 Initial load
duke
parents:
diff changeset
     7
 * published by the Free Software Foundation.
489c9b5090e2 Initial load
duke
parents:
diff changeset
     8
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
     9
 * This code is distributed in the hope that it will be useful, but WITHOUT
489c9b5090e2 Initial load
duke
parents:
diff changeset
    10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
489c9b5090e2 Initial load
duke
parents:
diff changeset
    11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
489c9b5090e2 Initial load
duke
parents:
diff changeset
    12
 * version 2 for more details (a copy is included in the LICENSE file that
489c9b5090e2 Initial load
duke
parents:
diff changeset
    13
 * accompanied this code).
489c9b5090e2 Initial load
duke
parents:
diff changeset
    14
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
    15
 * You should have received a copy of the GNU General Public License version
489c9b5090e2 Initial load
duke
parents:
diff changeset
    16
 * 2 along with this work; if not, write to the Free Software Foundation,
489c9b5090e2 Initial load
duke
parents:
diff changeset
    17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
489c9b5090e2 Initial load
duke
parents:
diff changeset
    18
 *
5547
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1217
diff changeset
    19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1217
diff changeset
    20
 * or visit www.oracle.com if you need additional information or have any
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1217
diff changeset
    21
 * questions.
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    22
 *
489c9b5090e2 Initial load
duke
parents:
diff changeset
    23
 */
489c9b5090e2 Initial load
duke
parents:
diff changeset
    24
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 5547
diff changeset
    25
#ifndef CPU_X86_VM_C1_LINEARSCAN_X86_HPP
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 5547
diff changeset
    26
#define CPU_X86_VM_C1_LINEARSCAN_X86_HPP
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 5547
diff changeset
    27
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    28
inline bool LinearScan::is_processed_reg_num(int reg_num) {
1066
717c3345024f 5108146: Merge i486 and amd64 cpu directories
never
parents: 1
diff changeset
    29
#ifndef _LP64
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    30
  // rsp and rbp (numbers 6 ancd 7) are ignored
489c9b5090e2 Initial load
duke
parents:
diff changeset
    31
  assert(FrameMap::rsp_opr->cpu_regnr() == 6, "wrong assumption below");
489c9b5090e2 Initial load
duke
parents:
diff changeset
    32
  assert(FrameMap::rbp_opr->cpu_regnr() == 7, "wrong assumption below");
489c9b5090e2 Initial load
duke
parents:
diff changeset
    33
  assert(reg_num >= 0, "invalid reg_num");
1066
717c3345024f 5108146: Merge i486 and amd64 cpu directories
never
parents: 1
diff changeset
    34
#else
7427
d7b79a367474 6985015: C1 needs to support compressed oops
iveresov
parents: 7397
diff changeset
    35
  // rsp and rbp, r10, r15 (numbers [12,15]) are ignored
d7b79a367474 6985015: C1 needs to support compressed oops
iveresov
parents: 7397
diff changeset
    36
  // r12 (number 11) is conditional on compressed oops.
d7b79a367474 6985015: C1 needs to support compressed oops
iveresov
parents: 7397
diff changeset
    37
  assert(FrameMap::r12_opr->cpu_regnr() == 11, "wrong assumption below");
1066
717c3345024f 5108146: Merge i486 and amd64 cpu directories
never
parents: 1
diff changeset
    38
  assert(FrameMap::r10_opr->cpu_regnr() == 12, "wrong assumption below");
717c3345024f 5108146: Merge i486 and amd64 cpu directories
never
parents: 1
diff changeset
    39
  assert(FrameMap::r15_opr->cpu_regnr() == 13, "wrong assumption below");
717c3345024f 5108146: Merge i486 and amd64 cpu directories
never
parents: 1
diff changeset
    40
  assert(FrameMap::rsp_opr->cpu_regnrLo() == 14, "wrong assumption below");
717c3345024f 5108146: Merge i486 and amd64 cpu directories
never
parents: 1
diff changeset
    41
  assert(FrameMap::rbp_opr->cpu_regnrLo() == 15, "wrong assumption below");
717c3345024f 5108146: Merge i486 and amd64 cpu directories
never
parents: 1
diff changeset
    42
  assert(reg_num >= 0, "invalid reg_num");
717c3345024f 5108146: Merge i486 and amd64 cpu directories
never
parents: 1
diff changeset
    43
#endif // _LP64
7427
d7b79a367474 6985015: C1 needs to support compressed oops
iveresov
parents: 7397
diff changeset
    44
  return reg_num <= FrameMap::last_cpu_reg() || reg_num >= pd_nof_cpu_regs_frame_map;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    45
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
    46
489c9b5090e2 Initial load
duke
parents:
diff changeset
    47
inline int LinearScan::num_physical_regs(BasicType type) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
    48
  // Intel requires two cpu registers for long,
489c9b5090e2 Initial load
duke
parents:
diff changeset
    49
  // but requires only one fpu register for double
1066
717c3345024f 5108146: Merge i486 and amd64 cpu directories
never
parents: 1
diff changeset
    50
  if (LP64_ONLY(false &&) type == T_LONG) {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    51
    return 2;
489c9b5090e2 Initial load
duke
parents:
diff changeset
    52
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
    53
  return 1;
489c9b5090e2 Initial load
duke
parents:
diff changeset
    54
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
    55
489c9b5090e2 Initial load
duke
parents:
diff changeset
    56
489c9b5090e2 Initial load
duke
parents:
diff changeset
    57
inline bool LinearScan::requires_adjacent_regs(BasicType type) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
    58
  return false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
    59
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
    60
489c9b5090e2 Initial load
duke
parents:
diff changeset
    61
inline bool LinearScan::is_caller_save(int assigned_reg) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
    62
  assert(assigned_reg >= 0 && assigned_reg < nof_regs, "should call this only for registers");
489c9b5090e2 Initial load
duke
parents:
diff changeset
    63
  return true; // no callee-saved registers on Intel
489c9b5090e2 Initial load
duke
parents:
diff changeset
    64
489c9b5090e2 Initial load
duke
parents:
diff changeset
    65
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
    66
489c9b5090e2 Initial load
duke
parents:
diff changeset
    67
489c9b5090e2 Initial load
duke
parents:
diff changeset
    68
inline void LinearScan::pd_add_temps(LIR_Op* op) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
    69
  switch (op->code()) {
35540
e001ad24dcdb 8143353: update for x86 sin and cos in the math lib
vdeshpande
parents: 30624
diff changeset
    70
    case lir_tan: {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    71
      // The slow path for these functions may need to save and
489c9b5090e2 Initial load
duke
parents:
diff changeset
    72
      // restore all live registers but we don't want to save and
489c9b5090e2 Initial load
duke
parents:
diff changeset
    73
      // restore everything all the time, so mark the xmms as being
489c9b5090e2 Initial load
duke
parents:
diff changeset
    74
      // killed.  If the slow path were explicit or we could propagate
489c9b5090e2 Initial load
duke
parents:
diff changeset
    75
      // live register masks down to the assembly we could do better
489c9b5090e2 Initial load
duke
parents:
diff changeset
    76
      // but we don't have any easy way to do that right now.  We
489c9b5090e2 Initial load
duke
parents:
diff changeset
    77
      // could also consider not killing all xmm registers if we
489c9b5090e2 Initial load
duke
parents:
diff changeset
    78
      // assume that slow paths are uncommon but it's not clear that
489c9b5090e2 Initial load
duke
parents:
diff changeset
    79
      // would be a good idea.
489c9b5090e2 Initial load
duke
parents:
diff changeset
    80
      if (UseSSE > 0) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
    81
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
    82
        if (TraceLinearScanLevel >= 2) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
    83
          tty->print_cr("killing XMMs for trig");
489c9b5090e2 Initial load
duke
parents:
diff changeset
    84
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
    85
#endif
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 7427
diff changeset
    86
        int num_caller_save_xmm_regs = FrameMap::get_num_caller_save_xmms();
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    87
        int op_id = op->id();
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 7427
diff changeset
    88
        for (int xmm = 0; xmm < num_caller_save_xmm_regs; xmm++) {
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
    89
          LIR_Opr opr = FrameMap::caller_save_xmm_reg_at(xmm);
489c9b5090e2 Initial load
duke
parents:
diff changeset
    90
          add_temp(reg_num(opr), op_id, noUse, T_ILLEGAL);
489c9b5090e2 Initial load
duke
parents:
diff changeset
    91
        }
489c9b5090e2 Initial load
duke
parents:
diff changeset
    92
      }
489c9b5090e2 Initial load
duke
parents:
diff changeset
    93
      break;
489c9b5090e2 Initial load
duke
parents:
diff changeset
    94
    }
489c9b5090e2 Initial load
duke
parents:
diff changeset
    95
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
    96
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
    97
489c9b5090e2 Initial load
duke
parents:
diff changeset
    98
489c9b5090e2 Initial load
duke
parents:
diff changeset
    99
// Implementation of LinearScanWalker
489c9b5090e2 Initial load
duke
parents:
diff changeset
   100
489c9b5090e2 Initial load
duke
parents:
diff changeset
   101
inline bool LinearScanWalker::pd_init_regs_for_alloc(Interval* cur) {
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 7427
diff changeset
   102
  int last_xmm_reg = pd_last_xmm_reg;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 7427
diff changeset
   103
  if (UseAVX < 3) {
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 7427
diff changeset
   104
    last_xmm_reg = pd_first_xmm_reg + (pd_nof_xmm_regs_frame_map / 2) - 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 7427
diff changeset
   105
  }
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   106
  if (allocator()->gen()->is_vreg_flag_set(cur->reg_num(), LIRGenerator::byte_reg)) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   107
    assert(cur->type() != T_FLOAT && cur->type() != T_DOUBLE, "cpu regs only");
489c9b5090e2 Initial load
duke
parents:
diff changeset
   108
    _first_reg = pd_first_byte_reg;
7427
d7b79a367474 6985015: C1 needs to support compressed oops
iveresov
parents: 7397
diff changeset
   109
    _last_reg = FrameMap::last_byte_reg();
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   110
    return true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   111
  } else if ((UseSSE >= 1 && cur->type() == T_FLOAT) || (UseSSE >= 2 && cur->type() == T_DOUBLE)) {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   112
    _first_reg = pd_first_xmm_reg;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 7427
diff changeset
   113
    _last_reg = last_xmm_reg;
1
489c9b5090e2 Initial load
duke
parents:
diff changeset
   114
    return true;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   115
  }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   116
489c9b5090e2 Initial load
duke
parents:
diff changeset
   117
  return false;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   118
}
489c9b5090e2 Initial load
duke
parents:
diff changeset
   119
489c9b5090e2 Initial load
duke
parents:
diff changeset
   120
489c9b5090e2 Initial load
duke
parents:
diff changeset
   121
class FpuStackAllocator VALUE_OBJ_CLASS_SPEC {
489c9b5090e2 Initial load
duke
parents:
diff changeset
   122
 private:
489c9b5090e2 Initial load
duke
parents:
diff changeset
   123
  Compilation* _compilation;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   124
  LinearScan* _allocator;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   125
489c9b5090e2 Initial load
duke
parents:
diff changeset
   126
  LIR_OpVisitState visitor;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   127
489c9b5090e2 Initial load
duke
parents:
diff changeset
   128
  LIR_List* _lir;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   129
  int _pos;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   130
  FpuStackSim _sim;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   131
  FpuStackSim _temp_sim;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   132
489c9b5090e2 Initial load
duke
parents:
diff changeset
   133
  bool _debug_information_computed;
489c9b5090e2 Initial load
duke
parents:
diff changeset
   134
489c9b5090e2 Initial load
duke
parents:
diff changeset
   135
  LinearScan*   allocator()                      { return _allocator; }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   136
  Compilation*  compilation() const              { return _compilation; }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   137
489c9b5090e2 Initial load
duke
parents:
diff changeset
   138
  // unified bailout support
489c9b5090e2 Initial load
duke
parents:
diff changeset
   139
  void          bailout(const char* msg) const   { compilation()->bailout(msg); }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   140
  bool          bailed_out() const               { return compilation()->bailed_out(); }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   141
489c9b5090e2 Initial load
duke
parents:
diff changeset
   142
  int pos() { return _pos; }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   143
  void set_pos(int pos) { _pos = pos; }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   144
  LIR_Op* cur_op() { return lir()->instructions_list()->at(pos()); }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   145
  LIR_List* lir() { return _lir; }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   146
  void set_lir(LIR_List* lir) { _lir = lir; }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   147
  FpuStackSim* sim() { return &_sim; }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   148
  FpuStackSim* temp_sim() { return &_temp_sim; }
489c9b5090e2 Initial load
duke
parents:
diff changeset
   149
489c9b5090e2 Initial load
duke
parents:
diff changeset
   150
  int fpu_num(LIR_Opr opr);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   151
  int tos_offset(LIR_Opr opr);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   152
  LIR_Opr to_fpu_stack_top(LIR_Opr opr, bool dont_check_offset = false);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   153
489c9b5090e2 Initial load
duke
parents:
diff changeset
   154
  // Helper functions for handling operations
489c9b5090e2 Initial load
duke
parents:
diff changeset
   155
  void insert_op(LIR_Op* op);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   156
  void insert_exchange(int offset);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   157
  void insert_exchange(LIR_Opr opr);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   158
  void insert_free(int offset);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   159
  void insert_free_if_dead(LIR_Opr opr);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   160
  void insert_free_if_dead(LIR_Opr opr, LIR_Opr ignore);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   161
  void insert_copy(LIR_Opr from, LIR_Opr to);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   162
  void do_rename(LIR_Opr from, LIR_Opr to);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   163
  void do_push(LIR_Opr opr);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   164
  void pop_if_last_use(LIR_Op* op, LIR_Opr opr);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   165
  void pop_always(LIR_Op* op, LIR_Opr opr);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   166
  void clear_fpu_stack(LIR_Opr preserve);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   167
  void handle_op1(LIR_Op1* op1);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   168
  void handle_op2(LIR_Op2* op2);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   169
  void handle_opCall(LIR_OpCall* opCall);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   170
  void compute_debug_information(LIR_Op* op);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   171
  void allocate_exception_handler(XHandler* xhandler);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   172
  void allocate_block(BlockBegin* block);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   173
489c9b5090e2 Initial load
duke
parents:
diff changeset
   174
#ifndef PRODUCT
489c9b5090e2 Initial load
duke
parents:
diff changeset
   175
  void check_invalid_lir_op(LIR_Op* op);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   176
#endif
489c9b5090e2 Initial load
duke
parents:
diff changeset
   177
489c9b5090e2 Initial load
duke
parents:
diff changeset
   178
  // Helper functions for merging of fpu stacks
489c9b5090e2 Initial load
duke
parents:
diff changeset
   179
  void merge_insert_add(LIR_List* instrs, FpuStackSim* cur_sim, int reg);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   180
  void merge_insert_xchg(LIR_List* instrs, FpuStackSim* cur_sim, int slot);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   181
  void merge_insert_pop(LIR_List* instrs, FpuStackSim* cur_sim);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   182
  bool merge_rename(FpuStackSim* cur_sim, FpuStackSim* sux_sim, int start_slot, int change_slot);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   183
  void merge_fpu_stack(LIR_List* instrs, FpuStackSim* cur_sim, FpuStackSim* sux_sim);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   184
  void merge_cleanup_fpu_stack(LIR_List* instrs, FpuStackSim* cur_sim, BitMap& live_fpu_regs);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   185
  bool merge_fpu_stack_with_successors(BlockBegin* block);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   186
489c9b5090e2 Initial load
duke
parents:
diff changeset
   187
 public:
489c9b5090e2 Initial load
duke
parents:
diff changeset
   188
  LIR_Opr to_fpu_stack(LIR_Opr opr); // used by LinearScan for creation of debug information
489c9b5090e2 Initial load
duke
parents:
diff changeset
   189
489c9b5090e2 Initial load
duke
parents:
diff changeset
   190
  FpuStackAllocator(Compilation* compilation, LinearScan* allocator);
489c9b5090e2 Initial load
duke
parents:
diff changeset
   191
  void allocate();
489c9b5090e2 Initial load
duke
parents:
diff changeset
   192
};
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 5547
diff changeset
   193
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 5547
diff changeset
   194
#endif // CPU_X86_VM_C1_LINEARSCAN_X86_HPP