7085404: JSR 292: VolatileCallSites should have push notification too
Reviewed-by: never, kvn
/*
* Copyright (c) 1997, 2011, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*
*/
#include "precompiled.hpp"
#include "classfile/classLoader.hpp"
#include "code/vtableStubs.hpp"
#include "gc_interface/collectedHeap.inline.hpp"
#include "interpreter/interpreter.hpp"
#include "memory/allocation.inline.hpp"
#include "memory/universe.inline.hpp"
#include "oops/oop.inline.hpp"
#include "oops/oop.inline2.hpp"
#include "oops/symbol.hpp"
#include "runtime/deoptimization.hpp"
#include "runtime/fprofiler.hpp"
#include "runtime/mutexLocker.hpp"
#include "runtime/stubCodeGenerator.hpp"
#include "runtime/stubRoutines.hpp"
#include "runtime/task.hpp"
#include "runtime/vframe.hpp"
#include "utilities/macros.hpp"
// Static fields of FlatProfiler
// Global tick counters. All of them start at zero; several are cleared again
// by FlatProfiler::reset().
int FlatProfiler::received_gc_ticks = 0;
int FlatProfiler::vm_operation_ticks = 0;
int FlatProfiler::threads_lock_ticks = 0;
int FlatProfiler::class_loader_ticks = 0;
int FlatProfiler::extra_ticks = 0;
int FlatProfiler::blocked_ticks = 0;
int FlatProfiler::deopt_ticks = 0;
int FlatProfiler::unknown_ticks = 0;
int FlatProfiler::interpreter_ticks = 0;
int FlatProfiler::compiler_ticks = 0;
int FlatProfiler::received_ticks = 0;
int FlatProfiler::delivered_ticks = 0;
// Per-bytecode tick tables; NULL until allocate_table() has run.
int* FlatProfiler::bytecode_ticks = NULL;
int* FlatProfiler::bytecode_ticks_stub = NULL;
int FlatProfiler::all_int_ticks = 0;
int FlatProfiler::all_comp_ticks = 0;
int FlatProfiler::all_ticks = 0;
// Set by engage(); when false, only the aggregate counters are maintained.
bool FlatProfiler::full_profile_flag = false;
// engage() always leaves thread_profiler NULL (one profiler per thread is used instead).
ThreadProfiler* FlatProfiler::thread_profiler = NULL;
// Created by engage() when ProfileVM is set.
ThreadProfiler* FlatProfiler::vm_thread_profiler = NULL;
// Periodic sampling task; non-NULL exactly while the profiler is active.
FlatProfilerTask* FlatProfiler::task = NULL;
elapsedTimer FlatProfiler::timer;
// Value of received_ticks at the moment the previous interval expired.
int FlatProfiler::interval_ticks_previous = 0;
IntervalData* FlatProfiler::interval_data = NULL;
// Sets up a profiler for one thread: reserves the arena from which
// ProfilerNodes are bump-allocated, allocates the bucket table, clears all
// counters and leaves the profiler disengaged.
ThreadProfiler::ThreadProfiler() {
  // Arena for the ProfilerNodes (1024 units of ProfilerNodeSize bytes).
  const int arena_bytes = 1 * ProfilerNodeSize * 1024;
  area_bottom = AllocateHeap(arena_bytes, "fprofiler");
  area_limit  = area_bottom + arena_bytes;
  area_top    = area_bottom;

  // Bucket table of ProfilerNode chains.
  table = NEW_C_HEAP_ARRAY(ProfilerNode*, table_size);

  initialize();
  engaged = false;
}
// Releases the node arena and the bucket table, then clears every pointer
// that referred into them.
ThreadProfiler::~ThreadProfiler() {
  // Give back the node arena.
  FreeHeap(area_bottom);
  area_limit  = NULL;
  area_top    = NULL;
  area_bottom = NULL;

  // Give back the bucket table.
  FreeHeap(table);
  table = NULL;
}
// Statics for ThreadProfiler
// Number of buckets in each ThreadProfiler's node table; entry() reduces
// hash values modulo this size.
int ThreadProfiler::table_size = 1024;
// Maps an arbitrary hash value onto a bucket index in [0, table_size).
//
// The magnitude is computed in unsigned arithmetic: negating INT_MIN as a
// signed int is undefined behaviour, and the hash functions feeding this
// routine can produce any bit pattern.
int ThreadProfiler::entry(int value) {
  const unsigned int bits = (unsigned int) value;
  const unsigned int magnitude = (value < 0) ? (0u - bits) : bits;
  return (int) (magnitude % (unsigned int) table_size);
}
// Flags region `r` as active on the current thread's profiler for the
// lifetime of this mark. Nothing is flagged when the current thread is not a
// JavaThread or has no profiler attached.
ThreadProfilerMark::ThreadProfilerMark(ThreadProfilerMark::Region r) {
  assert(((r > ThreadProfilerMark::noRegion) && (r < ThreadProfilerMark::maxRegion)), "ThreadProfilerMark::Region out of bounds");
  _r = r;
  _pp = NULL;

  Thread* current = Thread::current();
  if (current == NULL || !current->is_Java_thread()) {
    return;
  }

  // Remember the profiler so the destructor can clear the flag again.
  _pp = ((JavaThread*) current)->get_thread_profiler();
  if (_pp != NULL) {
    _pp->region_flag[r] = true;
  }
}
// Clears the region flag set by the constructor (if any) and forgets the
// profiler.
ThreadProfilerMark::~ThreadProfilerMark() {
  ThreadProfiler* const marked = _pp;
  _pp = NULL;
  if (marked != NULL) {
    marked->region_flag[_r] = false;
  }
}
// Random other statics
// Output column positions; the printing code below passes them to
// outputStream::fill_to() to line up the report.
static const int col1 = 2; // position of output column 1
static const int col2 = 11; // position of output column 2
static const int col3 = 25; // position of output column 3
static const int col4 = 55; // position of output column 4
// Used for detailed profiling of nmethods.
class PCRecorder : AllStatic {
private:
static int* counters;
static address base;
enum {
bucket_size = 16
};
static int index_for(address pc) { return (pc - base)/bucket_size; }
static address pc_for(int index) { return base + (index * bucket_size); }
static int size() {
return ((int)CodeCache::max_capacity())/bucket_size * BytesPerWord;
}
public:
static address bucket_start_for(address pc) {
if (counters == NULL) return NULL;
return pc_for(index_for(pc));
}
static int bucket_count_for(address pc) { return counters[index_for(pc)]; }
static void init();
static void record(address pc);
static void print();
static void print_blobs(CodeBlob* cb);
};
// PCRecorder state. counters stays NULL until PCRecorder::init() runs, which
// is how record() and print() detect that PC recording is switched off.
int* PCRecorder::counters = NULL;
address PCRecorder::base = NULL;
// Allocates and zeroes the bucket counters and records the base address of
// the code cache. Runs with CodeCache_lock held (no safepoint check).
void PCRecorder::init() {
  MutexLockerEx lm(CodeCache_lock, Mutex::_no_safepoint_check_flag);
  const int bucket_total = size();
  counters = NEW_C_HEAP_ARRAY(int, bucket_total);
  for (int bucket = bucket_total - 1; bucket >= 0; bucket--) {
    counters[bucket] = 0;
  }
  base = CodeCache::first_address();
}
// Adds one tick to the bucket containing pc. Does nothing while recording
// is off (counters not allocated).
void PCRecorder::record(address pc) {
  if (counters != NULL) {
    assert(CodeCache::contains(pc), "must be in CodeCache");
    counters[index_for(pc)] += 1;
  }
}
// Public forwarding wrapper around PCRecorder::bucket_start_for().
address FlatProfiler::bucket_start_for(address pc) {
  const address bucket_start = PCRecorder::bucket_start_for(pc);
  return bucket_start;
}
// Public forwarding wrapper around PCRecorder::bucket_count_for().
int FlatProfiler::bucket_count_for(address pc) {
  const int tick_count = PCRecorder::bucket_count_for(pc);
  return tick_count;
}
void PCRecorder::print() {
if (counters == NULL) return;
tty->cr();
tty->print_cr("Printing compiled methods with PC buckets having more than %d ticks", ProfilerPCTickThreshold);
tty->print_cr("===================================================================");
tty->cr();
GrowableArray<CodeBlob*>* candidates = new GrowableArray<CodeBlob*>(20);
int s;
{
MutexLockerEx lm(CodeCache_lock, Mutex::_no_safepoint_check_flag);
s = size();
}
for (int index = 0; index < s; index++) {
int count = counters[index];
if (count > ProfilerPCTickThreshold) {
address pc = pc_for(index);
CodeBlob* cb = CodeCache::find_blob_unsafe(pc);
if (cb != NULL && candidates->find(cb) < 0) {
candidates->push(cb);
}
}
}
for (int i = 0; i < candidates->length(); i++) {
print_blobs(candidates->at(i));
}
}
// Prints one code blob; nmethods additionally get their code printed.
// A NULL blob is reported as "stub code".
void PCRecorder::print_blobs(CodeBlob* cb) {
  if (cb == NULL) {
    tty->print_cr("stub code");
    return;
  }
  cb->print();
  if (cb->is_nmethod()) {
    nmethod* nm = (nmethod*)cb;
    nm->print_code();
  }
  tty->cr();
}
// Tick totals for one profiler node, split by where the tick landed:
// in the code itself or in native code.
class tick_counter {
 public:
  int ticks_in_code;
  int ticks_in_native;

  tick_counter() : ticks_in_code(0), ticks_in_native(0) {}
  tick_counter(int code, int native) : ticks_in_code(code), ticks_in_native(native) {}

  // Sum of both categories.
  int total() const {
    return ticks_in_code + ticks_in_native;
  }

  // Accumulates another counter into this one.
  void add(tick_counter* a) {
    ticks_in_native += a->ticks_in_native;
    ticks_in_code   += a->ticks_in_code;
  }

  // Counts one tick in the category selected by `where`; any other
  // position value is ignored.
  void update(TickPosition where) {
    if (where == tp_code) {
      ticks_in_code++;
    } else if (where == tp_native) {
      ticks_in_native++;
    }
  }

  // Prints the share of total_ticks taken by this counter and the in-code count.
  void print_code(outputStream* st, int total_ticks) {
    const double percent = total() * 100.0 / total_ticks;
    st->print("%5.1f%% %5d ", percent, ticks_in_code);
  }

  // Prints the native tick count.
  void print_native(outputStream* st) {
    st->print(" + %5d ", ticks_in_native);
  }
};
class ProfilerNode {
private:
ProfilerNode* _next;
public:
tick_counter ticks;
public:
void* operator new(size_t size, ThreadProfiler* tp);
void operator delete(void* p);
ProfilerNode() {
_next = NULL;
}
virtual ~ProfilerNode() {
if (_next)
delete _next;
}
void set_next(ProfilerNode* n) { _next = n; }
ProfilerNode* next() { return _next; }
void update(TickPosition where) { ticks.update(where);}
int total_ticks() { return ticks.total(); }
virtual bool is_interpreted() const { return false; }
virtual bool is_compiled() const { return false; }
virtual bool is_stub() const { return false; }
virtual bool is_runtime_stub() const{ return false; }
virtual void oops_do(OopClosure* f) = 0;
virtual bool interpreted_match(methodOop m) const { return false; }
virtual bool compiled_match(methodOop m ) const { return false; }
virtual bool stub_match(methodOop m, const char* name) const { return false; }
virtual bool adapter_match() const { return false; }
virtual bool runtimeStub_match(const CodeBlob* stub, const char* name) const { return false; }
virtual bool unknown_compiled_match(const CodeBlob* cb) const { return false; }
static void print_title(outputStream* st) {
st->print(" + native");
st->fill_to(col3);
st->print("Method");
st->fill_to(col4);
st->cr();
}
static void print_total(outputStream* st, tick_counter* t, int total, const char* msg) {
t->print_code(st, total);
st->fill_to(col2);
t->print_native(st);
st->fill_to(col3);
st->print(msg);
st->cr();
}
virtual methodOop method() = 0;
virtual void print_method_on(outputStream* st) {
int limit;
int i;
methodOop m = method();
Symbol* k = m->klass_name();
// Print the class name with dots instead of slashes
limit = k->utf8_length();
for (i = 0 ; i < limit ; i += 1) {
char c = (char) k->byte_at(i);
if (c == '/') {
c = '.';
}
st->print("%c", c);
}
if (limit > 0) {
st->print(".");
}
Symbol* n = m->name();
limit = n->utf8_length();
for (i = 0 ; i < limit ; i += 1) {
char c = (char) n->byte_at(i);
st->print("%c", c);
}
if( Verbose ) {
// Disambiguate overloaded methods
Symbol* sig = m->signature();
sig->print_symbol_on(st);
}
}
virtual void print(outputStream* st, int total_ticks) {
ticks.print_code(st, total_ticks);
st->fill_to(col2);
ticks.print_native(st);
st->fill_to(col3);
print_method_on(st);
st->cr();
}
// for hashing into the table
static int hash(methodOop method) {
// The point here is to try to make something fairly unique
// out of the fields we can read without grabbing any locks
// since the method may be locked when we need the hash.
return (
method->code_size() ^
method->max_stack() ^
method->max_locals() ^
method->size_of_parameters());
}
// for sorting
static int compare(ProfilerNode** a, ProfilerNode** b) {
return (*b)->total_ticks() - (*a)->total_ticks();
}
};
// Bump-allocates `size` bytes from the arena of the given ThreadProfiler.
// Running past the end of the arena is a fatal error.
void* ProfilerNode::operator new(size_t size, ThreadProfiler* tp){
  void* const chunk = (void*) tp->area_top;
  tp->area_top += size;
  if (!(tp->area_top <= tp->area_limit)) {
    fatal("flat profiler buffer overflow");
  }
  return chunk;
}
// Intentionally a no-op: nodes are carved out of the ThreadProfiler arena by
// operator new above, and this function returns nothing to that arena.
void ProfilerNode::operator delete(void* p){
}
// Node for ticks attributed to an interpreted method.
class interpretedNode : public ProfilerNode {
 private:
  methodOop _method;

 public:
  interpretedNode(methodOop method, TickPosition where)
    : ProfilerNode(), _method(method) {
    update(where);
  }

  bool is_interpreted() const { return true; }

  // Matches when the node was created for the very same method.
  bool interpreted_match(methodOop m) const { return m == _method; }

  methodOop method() { return _method; }

  void oops_do(OopClosure* f) {
    f->do_oop((oop*)&_method);
  }

  // Section heading for the interpreted-method table.
  static void print_title(outputStream* st) {
    st->fill_to(col1);
    st->print("%11s", "Interpreted");
    ProfilerNode::print_title(st);
  }

  void print(outputStream* st, int total_ticks) {
    ProfilerNode::print(st, total_ticks);
  }

  // Method name, plus the invocation counter when Verbose is set.
  void print_method_on(outputStream* st) {
    ProfilerNode::print_method_on(st);
    if (Verbose) {
      method()->invocation_counter()->print_short();
    }
  }
};
// Node for ticks attributed to a compiled method.
class compiledNode : public ProfilerNode {
 private:
  methodOop _method;

 public:
  compiledNode(methodOop method, TickPosition where)
    : ProfilerNode(), _method(method) {
    update(where);
  }

  bool is_compiled() const { return true; }

  // Matches when the node was created for the very same method.
  bool compiled_match(methodOop m) const { return m == _method; }

  methodOop method() { return _method; }

  void oops_do(OopClosure* f) {
    f->do_oop((oop*)&_method);
  }

  // Section heading for the compiled-method table.
  static void print_title(outputStream* st) {
    st->fill_to(col1);
    st->print("%11s", "Compiled");
    ProfilerNode::print_title(st);
  }

  void print(outputStream* st, int total_ticks) {
    ProfilerNode::print(st, total_ticks);
  }

  void print_method_on(outputStream* st) {
    ProfilerNode::print_method_on(st);
  }
};
// Node for ticks attributed to the stub of a method, optionally qualified by
// the name of a VM symbol.
class stubNode : public ProfilerNode {
 private:
  methodOop   _method;
  const char* _symbol;  // The name of the nearest VM symbol (for +ProfileVM). Points to a unique string

 public:
  stubNode(methodOop method, const char* name, TickPosition where)
    : ProfilerNode(), _method(method), _symbol(name) {
    update(where);
  }

  bool is_stub() const { return true; }

  // Both the method and the symbol pointer have to be identical.
  bool stub_match(methodOop m, const char* name) const {
    if (_method != m) {
      return false;
    }
    return _symbol == name;
  }

  methodOop method() { return _method; }

  void oops_do(OopClosure* f) {
    f->do_oop((oop*)&_method);
  }

  // Section heading for the stub table.
  static void print_title(outputStream* st) {
    st->fill_to(col1);
    st->print("%11s", "Stub");
    ProfilerNode::print_title(st);
  }

  void print(outputStream* st, int total_ticks) {
    ProfilerNode::print(st, total_ticks);
  }

  // Appends " (<symbol>)" when a symbol name is attached.
  void print_symbol_on(outputStream* st) {
    if (_symbol) {
      st->print(" (%s)", _symbol);
    }
  }

  void print_method_on(outputStream* st) {
    ProfilerNode::print_method_on(st);
    print_symbol_on(st);
  }
};
// Single catch-all node for ticks that landed in adapters. It has no method
// and no oops.
class adapterNode : public ProfilerNode {
 public:
  adapterNode(TickPosition where) : ProfilerNode() {
    update(where);
  }

  bool is_compiled() const   { return true; }
  bool adapter_match() const { return true; }

  methodOop method() { return NULL; }

  // Nothing to visit.
  void oops_do(OopClosure* f) {
  }

  void print(outputStream* st, int total_ticks) {
    ProfilerNode::print(st, total_ticks);
  }

  void print_method_on(outputStream* st) {
    st->print("%s", "adapters");
  }
};
class runtimeStubNode : public ProfilerNode {
private:
const CodeBlob* _stub;
const char* _symbol; // The name of the nearest VM symbol when ProfileVM is on. Points to a unique string.
public:
runtimeStubNode(const CodeBlob* stub, const char* name, TickPosition where) : ProfilerNode(), _stub(stub), _symbol(name) {
assert(stub->is_runtime_stub(), "wrong code blob");
update(where);
}
bool is_runtime_stub() const { return true; }
bool runtimeStub_match(const CodeBlob* stub, const char* name) const {
assert(stub->is_runtime_stub(), "wrong code blob");
return ((RuntimeStub*)_stub)->entry_point() == ((RuntimeStub*)stub)->entry_point() &&
(_symbol == name);
}
methodOop method() { return NULL; }
static void print_title(outputStream* st) {
st->fill_to(col1);
st->print("%11s", "Runtime stub");
ProfilerNode::print_title(st);
}
void oops_do(OopClosure* f) {
;
}
void print(outputStream* st, int total_ticks) {
ProfilerNode::print(st, total_ticks);
}
void print_method_on(outputStream* st) {
st->print("%s", ((RuntimeStub*)_stub)->name());
print_symbol_on(st);
}
void print_symbol_on(outputStream* st) {
if(_symbol) {
st->print(" (%s)", _symbol);
}
}
};
// Node for ticks in code blobs that are not nmethods or runtime stubs.
// Blobs are identified by name only.
class unknown_compiledNode : public ProfilerNode {
  const char *_name;

  // Name of a blob, read through the cast appropriate for its kind.
  static const char* name_of(const CodeBlob* cb) {
    if (cb->is_buffer_blob()) {
      return ((BufferBlob*)cb)->name();
    }
    return ((SingletonBlob*)cb)->name();
  }

 public:
  unknown_compiledNode(const CodeBlob* cb, TickPosition where)
    : ProfilerNode(), _name(name_of(cb)) {
    update(where);
  }

  bool is_compiled() const { return true; }

  // Matches blobs carrying the same name.
  bool unknown_compiled_match(const CodeBlob* cb) const {
    return strcmp(name_of(cb), _name) == 0;
  }

  methodOop method() { return NULL; }

  // Nothing to visit.
  void oops_do(OopClosure* f) {
  }

  void print(outputStream* st, int total_ticks) {
    ProfilerNode::print(st, total_ticks);
  }

  void print_method_on(outputStream* st) {
    st->print("%s", _name);
  }
};
// Node for ticks attributed to VM code, identified by an optional symbol
// name. A node without a name is printed as "unknown code".
class vmNode : public ProfilerNode {
 private:
  const char* _name; // "optional" name obtained by os means such as dll lookup

 public:
  vmNode(const TickPosition where) : ProfilerNode() {
    _name = NULL;
    update(where);
  }

  vmNode(const char* name, const TickPosition where) : ProfilerNode() {
    _name = name;
    update(where);
  }

  const char *name() const { return _name; }
  bool is_compiled() const { return true; }

  // True when `name` denotes the same symbol as this node. Either side may
  // be NULL: two NULL names match each other and nothing else, so strcmp is
  // never handed a NULL pointer.
  bool vm_match(const char* name) const {
    if (name == NULL || _name == NULL) {
      return name == _name;
    }
    return strcmp(name, _name) == 0;
  }

  methodOop method() { return NULL; }

  // Computes a simple shift/xor hash of the name; NULL hashes to 0.
  // The accumulator is unsigned because left-shifting a signed int past its
  // range is undefined behaviour; the resulting bit pattern is unchanged.
  static int hash(const char* name){
    unsigned int h = 0;
    if (name != NULL) {
      for (const char* cp = name; *cp != '\0'; cp++) {
        // Go through int first so the character is widened exactly as before.
        h = (h << 1) ^ (unsigned int)(int)*cp;
      }
    }
    return (int)h;
  }

  // Nothing to visit.
  void oops_do(OopClosure* f) {
    ;
  }

  void print(outputStream* st, int total_ticks) {
    ProfilerNode::print(st, total_ticks);
  }

  void print_method_on(outputStream* st) {
    if(_name==NULL){
      st->print("%s", "unknown code");
    }
    else {
      st->print("%s", _name);
    }
  }
};
// Records one tick for an interpreted method: bumps the existing node for
// the method, or appends a new interpretedNode to the end of its bucket.
void ThreadProfiler::interpreted_update(methodOop method, TickPosition where) {
  const int bucket = entry(ProfilerNode::hash(method));

  ProfilerNode* tail = NULL;
  for (ProfilerNode* cur = table[bucket]; cur != NULL; cur = cur->next()) {
    if (cur->interpreted_match(method)) {
      cur->update(where);
      return;
    }
    tail = cur;
  }

  // No node yet: the constructor counts the first tick.
  ProfilerNode* fresh = new (this) interpretedNode(method, where);
  if (tail == NULL) {
    table[bucket] = fresh;
  } else {
    tail->set_next(fresh);
  }
}
// Records one tick for a compiled method: bumps the existing node for the
// method, or appends a new compiledNode to the end of its bucket.
void ThreadProfiler::compiled_update(methodOop method, TickPosition where) {
  const int bucket = entry(ProfilerNode::hash(method));

  ProfilerNode* tail = NULL;
  for (ProfilerNode* cur = table[bucket]; cur != NULL; cur = cur->next()) {
    if (cur->compiled_match(method)) {
      cur->update(where);
      return;
    }
    tail = cur;
  }

  // No node yet: the constructor counts the first tick.
  ProfilerNode* fresh = new (this) compiledNode(method, where);
  if (tail == NULL) {
    table[bucket] = fresh;
  } else {
    tail->set_next(fresh);
  }
}
// Records one tick for a method stub: bumps the node matching both method
// and symbol name, or appends a new stubNode to the end of the bucket.
void ThreadProfiler::stub_update(methodOop method, const char* name, TickPosition where) {
  const int bucket = entry(ProfilerNode::hash(method));

  ProfilerNode* tail = NULL;
  for (ProfilerNode* cur = table[bucket]; cur != NULL; cur = cur->next()) {
    if (cur->stub_match(method, name)) {
      cur->update(where);
      return;
    }
    tail = cur;
  }

  // No node yet: the constructor counts the first tick.
  ProfilerNode* fresh = new (this) stubNode(method, name, where);
  if (tail == NULL) {
    table[bucket] = fresh;
  } else {
    tail->set_next(fresh);
  }
}
// Records one tick for adapter code. The adapter node always lives in
// bucket 0.
void ThreadProfiler::adapter_update(TickPosition where) {
  const int bucket = 0;

  ProfilerNode* tail = NULL;
  for (ProfilerNode* cur = table[bucket]; cur != NULL; cur = cur->next()) {
    if (cur->adapter_match()) {
      cur->update(where);
      return;
    }
    tail = cur;
  }

  // No node yet: the constructor counts the first tick.
  ProfilerNode* fresh = new (this) adapterNode(where);
  if (tail == NULL) {
    table[bucket] = fresh;
  } else {
    tail->set_next(fresh);
  }
}
void ThreadProfiler::runtime_stub_update(const CodeBlob* stub, const char* name, TickPosition where) {
int index = 0;
if (!table[index]) {
table[index] = new (this) runtimeStubNode(stub, name, where);
} else {
ProfilerNode* prev = table[index];
for(ProfilerNode* node = prev; node; node = node->next()) {
if (node->runtimeStub_match(stub, name)) {
node->update(where);
return;
}
prev = node;
}
prev->set_next(new (this) runtimeStubNode(stub, name, where));
}
}
void ThreadProfiler::unknown_compiled_update(const CodeBlob* cb, TickPosition where) {
int index = 0;
if (!table[index]) {
table[index] = new (this) unknown_compiledNode(cb, where);
} else {
ProfilerNode* prev = table[index];
for(ProfilerNode* node = prev; node; node = node->next()) {
if (node->unknown_compiled_match(cb)) {
node->update(where);
return;
}
prev = node;
}
prev->set_next(new (this) unknown_compiledNode(cb, where));
}
}
// Records a VM tick that has no symbol name attached.
void ThreadProfiler::vm_update(TickPosition where) {
  const char* const no_name = NULL;
  vm_update(no_name, where);
}
void ThreadProfiler::vm_update(const char* name, TickPosition where) {
int index = entry(vmNode::hash(name));
assert(index >= 0, "Must be positive");
// Note that we call strdup below since the symbol may be resource allocated
if (!table[index]) {
table[index] = new (this) vmNode(os::strdup(name), where);
} else {
ProfilerNode* prev = table[index];
for(ProfilerNode* node = prev; node; node = node->next()) {
if (((vmNode *)node)->vm_match(name)) {
node->update(where);
return;
}
prev = node;
}
prev->set_next(new (this) vmNode(os::strdup(name), where));
}
}
// Periodic task that drives the flat profiler; task() is invoked once per
// interval and takes one sample.
class FlatProfilerTask : public PeriodicTask {
 public:
  FlatProfilerTask(int interval_time)
    : PeriodicTask(interval_time) {
  }

  void task();
};
// Attributes a tick that arrived during a VM operation to exactly one of:
// GC, deoptimization, or generic VM operation (checked in that order).
void FlatProfiler::record_vm_operation() {
  if (Universe::heap()->is_gc_active()) {
    FlatProfiler::received_gc_ticks += 1;
  } else if (DeoptimizationMarker::is_active()) {
    FlatProfiler::deopt_ticks += 1;
  } else {
    FlatProfiler::vm_operation_ticks += 1;
  }
}
// Profile the VM Thread itself if needed.
// This is done without getting the Threads_lock and we can go deep
// inside Safepoint, etc.
// A tick is attributed only when the sampled pc can be resolved to a
// function name; the thread tick counter is bumped regardless.
void FlatProfiler::record_vm_tick() {
  if (!ProfileVM) {
    return;
  }

  ResourceMark rm;
  char symbol[256];
  symbol[0] = '\0';

  vm_thread_profiler->inc_thread_ticks();

  // Get a snapshot of a current VMThread pc (and leave it running!)
  // The call may fail if, for instance the VM thread is interrupted while
  // holding the Interrupt_lock or for other reasons.
  ExtendedPC epc = os::get_thread_pc(VMThread::vm_thread());

  const bool resolved =
      epc.pc() != NULL &&
      os::dll_address_to_function_name(epc.pc(), symbol, sizeof(symbol), NULL);
  if (resolved) {
    const char* name = symbol;
    vm_thread_profiler->vm_update(name, tp_native);
  }
}
void FlatProfiler::record_thread_ticks() {
int maxthreads, suspendedthreadcount;
JavaThread** threadsList;
bool interval_expired = false;
if (ProfileIntervals &&
(FlatProfiler::received_ticks >= interval_ticks_previous + ProfileIntervalsTicks)) {
interval_expired = true;
interval_ticks_previous = FlatProfiler::received_ticks;
}
// Try not to wait for the Threads_lock
if (Threads_lock->try_lock()) {
{ // Threads_lock scope
maxthreads = Threads::number_of_threads();
threadsList = NEW_C_HEAP_ARRAY(JavaThread *, maxthreads);
suspendedthreadcount = 0;
for (JavaThread* tp = Threads::first(); tp != NULL; tp = tp->next()) {
if (tp->is_Compiler_thread()) {
// Only record ticks for active compiler threads
CompilerThread* cthread = (CompilerThread*)tp;
if (cthread->task() != NULL) {
// The compiler is active. If we need to access any of the fields
// of the compiler task we should suspend the CompilerThread first.
FlatProfiler::compiler_ticks += 1;
continue;
}
}
// First externally suspend all threads by marking each for
// external suspension - so it will stop at its next transition
// Then do a safepoint
ThreadProfiler* pp = tp->get_thread_profiler();
if (pp != NULL && pp->engaged) {
MutexLockerEx ml(tp->SR_lock(), Mutex::_no_safepoint_check_flag);
if (!tp->is_external_suspend() && !tp->is_exiting()) {
tp->set_external_suspend();
threadsList[suspendedthreadcount++] = tp;
}
}
}
Threads_lock->unlock();
}
// Suspend each thread. This call should just return
// for any threads that have already self-suspended
// Net result should be one safepoint
for (int j = 0; j < suspendedthreadcount; j++) {
JavaThread *tp = threadsList[j];
if (tp) {
tp->java_suspend();
}
}
// We are responsible for resuming any thread on this list
for (int i = 0; i < suspendedthreadcount; i++) {
JavaThread *tp = threadsList[i];
if (tp) {
ThreadProfiler* pp = tp->get_thread_profiler();
if (pp != NULL && pp->engaged) {
HandleMark hm;
FlatProfiler::delivered_ticks += 1;
if (interval_expired) {
FlatProfiler::interval_record_thread(pp);
}
// This is the place where we check to see if a user thread is
// blocked waiting for compilation.
if (tp->blocked_on_compilation()) {
pp->compiler_ticks += 1;
pp->interval_data_ref()->inc_compiling();
} else {
pp->record_tick(tp);
}
}
MutexLocker ml(Threads_lock);
tp->java_resume();
}
}
if (interval_expired) {
FlatProfiler::interval_print();
FlatProfiler::interval_reset();
}
} else {
// Couldn't get the threads lock, just record that rather than blocking
FlatProfiler::threads_lock_ticks += 1;
}
}
// One profiler tick: count it, optionally sample the VM thread, account for
// a running VM operation, and finally sample the Java threads unless a VM
// operation is in progress at a safepoint.
void FlatProfilerTask::task() {
  FlatProfiler::received_ticks += 1;

  if (ProfileVM) {
    FlatProfiler::record_vm_tick();
  }

  if (VMThread::vm_operation() != NULL) {
    FlatProfiler::record_vm_operation();
    if (SafepointSynchronize::is_at_safepoint()) {
      return;
    }
  }

  FlatProfiler::record_thread_ticks();
}
// Records a tick that landed in an interpreted frame. Without full
// profiling only the global counter is bumped. `ticks` is the per-bytecode
// table to update when the pc falls inside a bytecode codelet.
void ThreadProfiler::record_interpreted_tick(JavaThread* thread, frame fr, TickPosition where, int* ticks) {
  FlatProfiler::all_int_ticks++;
  if (FlatProfiler::full_profile()) {
    if (fr.is_interpreted_frame_valid(thread)) {
      // The frame has been fully validated so we can trust the method and bci
      methodOop sampled = *fr.interpreter_frame_method_addr();
      interpreted_update(sampled, where);

      // update byte code table
      InterpreterCodelet* codelet = Interpreter::codelet_containing(fr.pc());
      if (codelet != NULL && codelet->bytecode() >= 0) {
        ticks[codelet->bytecode()]++;
      }
    } else {
      // tick came at a bad time
      interpreter_ticks += 1;
      FlatProfiler::interpreter_ticks += 1;
    }
  }
}
// Records a tick that landed in the code cache. Without full profiling only
// the global counter is bumped. Ticks in a runtime stub are charged to the
// stub's sender frame as native time.
void ThreadProfiler::record_compiled_tick(JavaThread* thread, frame fr, TickPosition where) {
  FlatProfiler::all_comp_ticks++;
  if (!FlatProfiler::full_profile()) return;

  const char* name = NULL;  // no symbol name is attached on this path
  TickPosition position = where;
  CodeBlob* cb = fr.cb();

  // For runtime stubs, record as native rather than as compiled
  if (cb->is_runtime_stub()) {
    RegisterMap map(thread, false);
    fr = fr.sender(&map);
    cb = fr.cb();
    position = tp_native;
  }

  methodOop method = NULL;
  if (cb->is_nmethod()) {
    method = ((nmethod *)cb)->method();
  }

  if (method != NULL) {
    if (method->is_native()) {
      stub_update(method, name, position);
    } else {
      compiled_update(method, position);
    }
  } else if (cb->is_runtime_stub()) {
    runtime_stub_update(cb, name, position);
  } else {
    unknown_compiled_update(cb, position);
  }
}
// Declaration of an externally defined C-linkage function; it is not
// referenced in the visible part of this file.
extern "C" void find(int x);
// The tick happened in real code -> non VM code.
// Classifies the frame as interpreted, code-cache resident or vtable stub;
// otherwise falls back to the nearest Java sender frame, or counts the tick
// as unknown when there is none.
void ThreadProfiler::record_tick_for_running_frame(JavaThread* thread, frame fr) {
  if (fr.is_interpreted_frame()) {
    interval_data_ref()->inc_interpreted();
    record_interpreted_tick(thread, fr, tp_code, FlatProfiler::bytecode_ticks);
  } else if (CodeCache::contains(fr.pc())) {
    interval_data_ref()->inc_compiled();
    PCRecorder::record(fr.pc());
    record_compiled_tick(thread, fr, tp_code);
  } else if (VtableStubs::stub_containing(fr.pc()) != NULL) {
    unknown_ticks_array[ut_vtable_stubs] += 1;
  } else {
    frame caller = fr.profile_find_Java_sender_frame(thread);
    const bool have_caller = (caller.sp() != NULL && caller.pc() != NULL);
    if (have_caller) {
      record_tick_for_calling_frame(thread, caller);
    } else {
      unknown_ticks_array[ut_running_frame] += 1;
      FlatProfiler::unknown_ticks += 1;
    }
  }
}
// The tick happened in VM code.
// The tick is charged as native time to the given Java frame; if that frame
// is neither interpreted nor in the code cache, its Java sender is tried
// next, and the tick is counted as unknown when there is none.
void ThreadProfiler::record_tick_for_calling_frame(JavaThread* thread, frame fr) {
  interval_data_ref()->inc_native();

  if (fr.is_interpreted_frame()) {
    record_interpreted_tick(thread, fr, tp_native, FlatProfiler::bytecode_ticks_stub);
  } else if (CodeCache::contains(fr.pc())) {
    record_compiled_tick(thread, fr, tp_native);
  } else {
    frame caller = fr.profile_find_Java_sender_frame(thread);
    const bool have_caller = (caller.sp() != NULL && caller.pc() != NULL);
    if (have_caller) {
      record_tick_for_calling_frame(thread, caller);
    } else {
      unknown_ticks_array[ut_calling_frame] += 1;
      FlatProfiler::unknown_ticks += 1;
    }
  }
}
// Attributes one tick to the given (externally suspended) thread.
// Region flags set by ThreadProfilerMark take precedence; otherwise the
// thread state decides whether the tick is charged to running code, to the
// calling Java frame, to "blocked", or to one of the unknown categories.
void ThreadProfiler::record_tick(JavaThread* thread) {
  FlatProfiler::all_ticks++;
  thread_ticks += 1;

  // Here's another way to track global state changes.
  // When the class loader starts it marks the ThreadProfiler to tell it it is in the class loader
  // and we check that here.
  // This is more direct, and more than one thread can be in the class loader at a time,
  // but it does mean the class loader has to know about the profiler.
  if (region_flag[ThreadProfilerMark::classLoaderRegion]) {
    class_loader_ticks += 1;
    FlatProfiler::class_loader_ticks += 1;
    return;
  }
  if (region_flag[ThreadProfilerMark::extraRegion]) {
    extra_ticks += 1;
    FlatProfiler::extra_ticks += 1;
    return;
  }

  // Note that the WatcherThread can now stop for safepoints
  uint32_t debug_bits = 0;
  const bool suspended =
      thread->wait_for_ext_suspend_completion(SuspendRetryCount,
                                              SuspendRetryDelay, &debug_bits);
  if (!suspended) {
    unknown_ticks_array[ut_unknown_thread_state] += 1;
    FlatProfiler::unknown_ticks += 1;
    return;
  }

  frame fr;

  switch (thread->thread_state()) {
  case _thread_in_native:
  case _thread_in_native_trans:
  case _thread_in_vm:
  case _thread_in_vm_trans:
    if (!thread->profile_last_Java_frame(&fr)) {
      unknown_ticks_array[ut_no_last_Java_frame] += 1;
      FlatProfiler::unknown_ticks += 1;
      break;
    }
    if (fr.is_runtime_frame()) {
      RegisterMap map(thread, false);
      fr = fr.sender(&map);
    }
    record_tick_for_calling_frame(thread, fr);
    break;

  // handle_special_runtime_exit_condition self-suspends threads in Java
  case _thread_in_Java:
  case _thread_in_Java_trans:
    if (!thread->profile_last_Java_frame(&fr)) {
      unknown_ticks_array[ut_no_last_Java_frame] += 1;
      FlatProfiler::unknown_ticks += 1;
      break;
    }
    if (fr.is_safepoint_blob_frame()) {
      RegisterMap map(thread, false);
      fr = fr.sender(&map);
    }
    record_tick_for_running_frame(thread, fr);
    break;

  case _thread_blocked:
  case _thread_blocked_trans: {
    const bool runnable =
        thread->osthread() && thread->osthread()->get_state() == RUNNABLE;
    if (!runnable) {
      blocked_ticks += 1;
      FlatProfiler::blocked_ticks += 1;
      break;
    }
    if (!thread->profile_last_Java_frame(&fr)) {
      unknown_ticks_array[ut_no_last_Java_frame] += 1;
      FlatProfiler::unknown_ticks += 1;
      break;
    }
    if (fr.is_safepoint_blob_frame()) {
      RegisterMap map(thread, false);
      fr = fr.sender(&map);
      record_tick_for_running_frame(thread, fr);
    } else {
      record_tick_for_calling_frame(thread, fr);
    }
    break;
  }

  case _thread_uninitialized:
  case _thread_new:
  // not used, included for completeness
  case _thread_new_trans:
    unknown_ticks_array[ut_no_last_Java_frame] += 1;
    FlatProfiler::unknown_ticks += 1;
    break;

  default:
    unknown_ticks_array[ut_unknown_thread_state] += 1;
    FlatProfiler::unknown_ticks += 1;
    break;
  }
}
// Marks this profiler as engaged and starts its timer.
// FlatProfiler::record_thread_ticks() only samples threads whose profiler
// has the engaged flag set.
void ThreadProfiler::engage() {
engaged = true;
timer.start();
}
// Clears the engaged flag and stops this profiler's timer.
void ThreadProfiler::disengage() {
engaged = false;
timer.stop();
}
// Puts the profiler into its pristine state: empty bucket table, all tick
// counters zero, region flags cleared, timer started and interval data reset.
void ThreadProfiler::initialize() {
  // Empty every bucket.
  for (int bucket = 0; bucket < table_size; bucket++) {
    table[bucket] = NULL;
  }

  // Plain tick counters.
  thread_ticks       = 0;
  blocked_ticks      = 0;
  compiler_ticks     = 0;
  interpreter_ticks  = 0;
  class_loader_ticks = 0;
  extra_ticks        = 0;

  // One counter per "unknown" category.
  for (int kind = 0; kind < ut_end; kind++) {
    unknown_ticks_array[kind] = 0;
  }

  // No region is active.
  region_flag[ThreadProfilerMark::classLoaderRegion] = false;
  region_flag[ThreadProfilerMark::extraRegion] = false;

  timer.start();
  interval_data_ref()->reset();
}
void ThreadProfiler::reset() {
timer.stop();
if (table != NULL) {
for (int index = 0; index < table_size; index++) {
ProfilerNode* n = table[index];
if (n != NULL) {
delete n;
}
}
}
initialize();
}
// Allocates the global profiler tables: the two per-bytecode tick tables
// (zero-filled), the PC recorder when ProfilerRecordPC is set, and the
// interval data array.
void FlatProfiler::allocate_table() {
  // Bytecode tables
  const int code_count = Bytecodes::number_of_codes;
  bytecode_ticks      = NEW_C_HEAP_ARRAY(int, code_count);
  bytecode_ticks_stub = NEW_C_HEAP_ARRAY(int, code_count);
  for (int code = 0; code < code_count; code++) {
    bytecode_ticks[code]      = 0;
    bytecode_ticks_stub[code] = 0;
  }

  if (ProfilerRecordPC) {
    PCRecorder::init();
  }

  interval_data = NEW_C_HEAP_ARRAY(IntervalData, interval_print_size);
  FlatProfiler::interval_reset();
}
// Switches the flat profiler on: lazily creates the global tables, the VM
// thread profiler (when ProfileVM is set) and the periodic sampling task,
// starts the global timer and engages the profiler of mainThread, if one is
// given.
void FlatProfiler::engage(JavaThread* mainThread, bool fullProfile) {
  full_profile_flag = fullProfile;

  if (bytecode_ticks == NULL) {
    allocate_table();
  }

  if (ProfileVM && (vm_thread_profiler == NULL)) {
    vm_thread_profiler = new ThreadProfiler();
  }

  if (task == NULL) {
    task = new FlatProfilerTask(WatcherThread::delay_interval);
    task->enroll();
  }

  timer.start();

  if (mainThread != NULL) {
    // When mainThread was created, it might not have a ThreadProfiler
    ThreadProfiler* existing = mainThread->get_thread_profiler();
    if (existing != NULL) {
      existing->reset();
    } else {
      mainThread->set_thread_profiler(new ThreadProfiler());
    }
    mainThread->get_thread_profiler()->engage();
  }

  // This is where we would assign thread_profiler
  // if we wanted only one thread_profiler for all threads.
  thread_profiler = NULL;
}
void FlatProfiler::disengage() {
if (!task) {
return;
}
timer.stop();
task->disenroll();
delete task;
task = NULL;
if (thread_profiler != NULL) {
thread_profiler->disengage();
} else {
MutexLocker tl(Threads_lock);
for (JavaThread* tp = Threads::first(); tp != NULL; tp = tp->next()) {
ThreadProfiler* pp = tp->get_thread_profiler();
if (pp != NULL) {
pp->disengage();
}
}
}
}
void FlatProfiler::reset() {
if (task) {
disengage();
}
class_loader_ticks = 0;
extra_ticks = 0;
received_gc_ticks = 0;
vm_operation_ticks = 0;
compiler_ticks = 0;
deopt_ticks = 0;
interpreter_ticks = 0;
blocked_ticks = 0;
unknown_ticks = 0;
received_ticks = 0;
delivered_ticks = 0;
timer.stop();
}
// The profiler is active exactly while its sampling task exists.
bool FlatProfiler::is_active() {
  const bool has_task = (task != NULL);
  return has_task;
}
// Prints, for every bytecode with at least one recorded tick, the tick count
// from bytecode_ticks, the count from bytecode_ticks_stub and the bytecode
// name.
//
// The function used to allocate a GrowableArray that was never read; that
// dead allocation has been dropped.
void FlatProfiler::print_byte_code_statistics() {
  tty->print_cr(" Bytecode ticks:");
  for (int index = 0; index < Bytecodes::number_of_codes; index++) {
    if (FlatProfiler::bytecode_ticks[index] > 0 || FlatProfiler::bytecode_ticks_stub[index] > 0) {
      tty->print_cr(" %4d %4d = %s",
        FlatProfiler::bytecode_ticks[index],
        FlatProfiler::bytecode_ticks_stub[index],
        Bytecodes::name( (Bytecodes::Code) index));
    }
  }
  tty->cr();
}
// Print a single "<percent>% <ticks> <title>" line on tty.
//   title - label printed starting at column col3
//   ticks - tick count; nothing is printed unless it is positive
//   total - denominator used for the percentage
void print_ticks(const char* title, int ticks, int total) {
  if (ticks <= 0) {
    return;
  }
  const double percent = ticks * 100.0 / total;
  tty->print("%5.1f%% %5d", percent, ticks);
  tty->fill_to(col3);
  tty->print("%s", title);
  tty->cr();
}
// Print the flat profile collected by this ThreadProfiler to tty and then
// call reset().
//   thread_name - label shown in the "Flat profile of ..." header line.
//
// Returns without printing if there is no node table or no thread ticks
// were recorded. Printing is done while holding ProfilePrint_lock.
//
// Output, in order: header (with a "Lost ticks" line when the computed total
// differs from thread_ticks), then one section each for interpreted,
// compiled, stub and runtime-stub nodes, then the thread-local tick
// breakdown, and in WizardMode the node area usage.
void ThreadProfiler::print(const char* thread_name) {
  ResourceMark rm;
  MutexLocker ppl(ProfilePrint_lock);
  int index = 0; // Declared outside for loops for portability

  if (table == NULL) {
    return;
  }

  if (thread_ticks <= 0) {
    return;
  }

  const char* title = "too soon to tell";
  double secs = timer.seconds();

  // Flatten every hash bucket chain into one array and sort it with
  // ProfilerNode::compare.
  GrowableArray <ProfilerNode*>* array = new GrowableArray<ProfilerNode*>(200);
  for(index = 0; index < table_size; index++) {
    for(ProfilerNode* node = table[index]; node; node = node->next())
      array->append(node);
  }

  array->sort(&ProfilerNode::compare);

  // compute total (sanity check)
  int active =
    class_loader_ticks +
    compiler_ticks +
    interpreter_ticks +
    unknown_ticks();

  for (index = 0; index < array->length(); index++) {
    active += array->at(index)->ticks.total();
  }
  // "active" excludes blocked ticks; "total" includes them.
  int total = active + blocked_ticks;

  tty->cr();
  tty->print_cr("Flat profile of %3.2f secs (%d total ticks): %s", secs, total, thread_name);
  if (total != thread_ticks) {
    print_ticks("Lost ticks", thread_ticks-total, thread_ticks);
  }
  tty->cr();

  // print interpreted methods
  // Every matching node is added to the section total, but only the first
  // ProfilerNumberOfInterpretedMethods nodes are printed individually.
  tick_counter interpreted_ticks;
  bool has_interpreted_ticks = false;
  int print_count = 0;
  for (index = 0; index < array->length(); index++) {
    ProfilerNode* n = array->at(index);
    if (n->is_interpreted()) {
      interpreted_ticks.add(&n->ticks);
      if (!has_interpreted_ticks) {
        interpretedNode::print_title(tty);
        has_interpreted_ticks = true;
      }
      if (print_count++ < ProfilerNumberOfInterpretedMethods) {
        n->print(tty, active);
      }
    }
  }
  if (has_interpreted_ticks) {
    if (print_count <= ProfilerNumberOfInterpretedMethods) {
      title = "Total interpreted";
    } else {
      title = "Total interpreted (including elided)";
    }
    interpretedNode::print_total(tty, &interpreted_ticks, active, title);
    tty->cr();
  }

  // print compiled methods
  tick_counter compiled_ticks;
  bool has_compiled_ticks = false;
  print_count = 0;
  for (index = 0; index < array->length(); index++) {
    ProfilerNode* n = array->at(index);
    if (n->is_compiled()) {
      compiled_ticks.add(&n->ticks);
      if (!has_compiled_ticks) {
        compiledNode::print_title(tty);
        has_compiled_ticks = true;
      }
      if (print_count++ < ProfilerNumberOfCompiledMethods) {
        n->print(tty, active);
      }
    }
  }
  if (has_compiled_ticks) {
    if (print_count <= ProfilerNumberOfCompiledMethods) {
      title = "Total compiled";
    } else {
      title = "Total compiled (including elided)";
    }
    compiledNode::print_total(tty, &compiled_ticks, active, title);
    tty->cr();
  }

  // print stub methods
  tick_counter stub_ticks;
  bool has_stub_ticks = false;
  print_count = 0;
  for (index = 0; index < array->length(); index++) {
    ProfilerNode* n = array->at(index);
    if (n->is_stub()) {
      stub_ticks.add(&n->ticks);
      if (!has_stub_ticks) {
        stubNode::print_title(tty);
        has_stub_ticks = true;
      }
      if (print_count++ < ProfilerNumberOfStubMethods) {
        n->print(tty, active);
      }
    }
  }
  if (has_stub_ticks) {
    if (print_count <= ProfilerNumberOfStubMethods) {
      title = "Total stub";
    } else {
      title = "Total stub (including elided)";
    }
    stubNode::print_total(tty, &stub_ticks, active, title);
    tty->cr();
  }

  // print runtime stubs
  tick_counter runtime_stub_ticks;
  bool has_runtime_stub_ticks = false;
  print_count = 0;
  for (index = 0; index < array->length(); index++) {
    ProfilerNode* n = array->at(index);
    if (n->is_runtime_stub()) {
      runtime_stub_ticks.add(&n->ticks);
      if (!has_runtime_stub_ticks) {
        runtimeStubNode::print_title(tty);
        has_runtime_stub_ticks = true;
      }
      if (print_count++ < ProfilerNumberOfRuntimeStubNodes) {
        n->print(tty, active);
      }
    }
  }
  if (has_runtime_stub_ticks) {
    if (print_count <= ProfilerNumberOfRuntimeStubNodes) {
      title = "Total runtime stubs";
    } else {
      title = "Total runtime stubs (including elided)";
    }
    runtimeStubNode::print_total(tty, &runtime_stub_ticks, active, title);
    tty->cr();
  }

  // Thread-local breakdown: blocked ticks are shown relative to "total",
  // everything else relative to "active".
  if (blocked_ticks + class_loader_ticks + interpreter_ticks + compiler_ticks + unknown_ticks() != 0) {
    tty->fill_to(col1);
    tty->print_cr("Thread-local ticks:");
    print_ticks("Blocked (of total)", blocked_ticks, total);
    print_ticks("Class loader", class_loader_ticks, active);
    print_ticks("Extra", extra_ticks, active);
    print_ticks("Interpreter", interpreter_ticks, active);
    print_ticks("Compilation", compiler_ticks, active);
    print_ticks("Unknown: vtable stubs", unknown_ticks_array[ut_vtable_stubs], active);
    print_ticks("Unknown: null method", unknown_ticks_array[ut_null_method], active);
    print_ticks("Unknown: running frame", unknown_ticks_array[ut_running_frame], active);
    print_ticks("Unknown: calling frame", unknown_ticks_array[ut_calling_frame], active);
    print_ticks("Unknown: no pc", unknown_ticks_array[ut_no_pc], active);
    print_ticks("Unknown: no last frame", unknown_ticks_array[ut_no_last_Java_frame], active);
    print_ticks("Unknown: thread_state", unknown_ticks_array[ut_unknown_thread_state], active);
    tty->cr();
  }

  if (WizardMode) {
    // "%d" consumes an int from the varargs list. The area difference may be
    // wider than int (e.g. a pointer difference on 64-bit targets), so
    // narrow it explicitly instead of passing a mismatched argument.
    tty->print_cr("Node area used: %dKb", (int)((area_top - area_bottom) / 1024));
  }

  reset();
}
/*
ThreadProfiler::print_unknown(){
if (table == NULL) {
return;
}
if (thread_ticks <= 0) {
return;
}
} */
void FlatProfiler::print(int unused) {
ResourceMark rm;
if (thread_profiler != NULL) {
thread_profiler->print("All threads");
} else {
MutexLocker tl(Threads_lock);
for (JavaThread* tp = Threads::first(); tp != NULL; tp = tp->next()) {
ThreadProfiler* pp = tp->get_thread_profiler();
if (pp != NULL) {
pp->print(tp->get_thread_name());
}
}
}
if (ProfilerPrintByteCodeStatistics) {
print_byte_code_statistics();
}
if (non_method_ticks() > 0) {
tty->cr();
tty->print_cr("Global summary of %3.2f seconds:", timer.seconds());
print_ticks("Received ticks", received_ticks, received_ticks);
print_ticks("Received GC ticks", received_gc_ticks, received_ticks);
print_ticks("Compilation", compiler_ticks, received_ticks);
print_ticks("Deoptimization", deopt_ticks, received_ticks);
print_ticks("Other VM operations", vm_operation_ticks, received_ticks);
#ifndef PRODUCT
print_ticks("Blocked ticks", blocked_ticks, received_ticks);
print_ticks("Threads_lock blocks", threads_lock_ticks, received_ticks);
print_ticks("Delivered ticks", delivered_ticks, received_ticks);
print_ticks("All ticks", all_ticks, received_ticks);
#endif
print_ticks("Class loader", class_loader_ticks, received_ticks);
print_ticks("Extra ", extra_ticks, received_ticks);
print_ticks("Interpreter", interpreter_ticks, received_ticks);
print_ticks("Unknown code", unknown_ticks, received_ticks);
}
PCRecorder::print();
if(ProfileVM){
tty->cr();
vm_thread_profiler->print("VM Thread");
}
}
// Write the column legend "i/c/n/g" to st; it lines up with the four
// slash-separated counters written by print_data().
void IntervalData::print_header(outputStream* st) {
  st->print(
    "i/c/n/g");
}
// Write this interval's counters to st as
// "interpreted/compiled/native/compiling".
void IntervalData::print_data(outputStream* st) {
  st->print("%d/%d/%d/%d",
            this->interpreted(),
            this->compiled(),
            this->native(),
            this->compiling());
}
// Take a copy of tp's interval data, reset tp's counters, and insert the copy
// into interval_data[], which is kept ordered by descending total(). Entries
// at and after the insertion slot move down by one and the last one is
// dropped. Nothing is inserted if the sample's total does not exceed any
// stored total.
void FlatProfiler::interval_record_thread(ThreadProfiler* tp) {
  IntervalData sample = tp->interval_data();
  int sample_total = sample.total();
  tp->interval_data_ref()->reset();

  // Locate the first slot whose total is smaller than the sample's.
  int slot = 0;
  while (slot < interval_print_size &&
         !(sample_total > interval_data[slot].total())) {
    slot += 1;
  }
  if (slot >= interval_print_size) {
    return;  // not relevant enough to be recorded
  }

  // Make room by shifting the tail down one position, then insert.
  for (int k = interval_print_size - 1; k > slot; k -= 1) {
    interval_data[k] = interval_data[k - 1];
  }
  interval_data[slot] = sample;
}
// Print one line with a stamp, the header legend and every recorded interval
// entry that has a positive total. Prints nothing when the first entry has
// no ticks.
void FlatProfiler::interval_print() {
  if (!(interval_data[0].total() > 0)) {
    return;
  }

  tty->stamp();
  tty->print("\t");
  IntervalData::print_header(tty);

  for (int slot = 0; slot < interval_print_size; slot++) {
    if (!(interval_data[slot].total() > 0)) {
      continue;
    }
    tty->print("\t");
    interval_data[slot].print_data(tty);
  }
  tty->cr();
}
// Reset every entry of the interval_data[] table.
void FlatProfiler::interval_reset() {
  int slot = 0;
  while (slot < interval_print_size) {
    interval_data[slot].reset();
    slot++;
  }
}
// Apply closure f to every ProfilerNode in this profiler's table by calling
// each node's oops_do(). Does nothing when no table has been allocated.
void ThreadProfiler::oops_do(OopClosure* f) {
  if (table == NULL) {
    return;
  }

  for (int bucket = 0; bucket < table_size; bucket++) {
    // Walk the chain of nodes hanging off this bucket.
    ProfilerNode* current = table[bucket];
    while (current != NULL) {
      current->oops_do(f);
      current = current->next();
    }
  }
}
// Forward closure f to the shared thread profiler if there is one, otherwise
// to the ThreadProfiler of every Java thread that has one.
void FlatProfiler::oops_do(OopClosure* f) {
  if (thread_profiler == NULL) {
    JavaThread* jt = Threads::first();
    while (jt != NULL) {
      ThreadProfiler* profiler = jt->get_thread_profiler();
      if (profiler != NULL) {
        profiler->oops_do(f);
      }
      jt = jt->next();
    }
  } else {
    thread_profiler->oops_do(f);
  }
}