diff --git a/src/hotspot/cpu/aarch64/codeBuffer_aarch64.cpp b/src/hotspot/cpu/aarch64/codeBuffer_aarch64.cpp index 4257782fdc2..a4213707afb 100644 --- a/src/hotspot/cpu/aarch64/codeBuffer_aarch64.cpp +++ b/src/hotspot/cpu/aarch64/codeBuffer_aarch64.cpp @@ -26,6 +26,56 @@ #include "asm/codeBuffer.inline.hpp" #include "asm/macroAssembler.hpp" -bool CodeBuffer::pd_finalize_stubs() { - return emit_shared_stubs_to_interp(this, _shared_stub_to_interp_requests); +void CodeBuffer::share_trampoline_for(address dest, int caller_offset) { + if (_shared_trampoline_requests == nullptr) { + constexpr unsigned init_size = 8; + constexpr unsigned max_size = 256; + _shared_trampoline_requests = new SharedTrampolineRequests(init_size, max_size); + } + + bool created; + Offsets* offsets = _shared_trampoline_requests->put_if_absent(dest, &created); + if (created) { + _shared_trampoline_requests->maybe_grow(); + } + offsets->add(caller_offset); + _finalize_stubs = true; +} + +static bool emit_shared_trampolines(CodeBuffer* cb, CodeBuffer::SharedTrampolineRequests* requests) { + if (requests == nullptr) { + return true; + } + + MacroAssembler masm(cb); + + bool p_succeeded = true; + auto emit = [&](address dest, const CodeBuffer::Offsets &offsets) { + masm.set_code_section(cb->stubs()); + masm.align(wordSize); + + LinkedListIterator it(offsets.head()); + int offset = *it.next(); + for (; !it.is_empty(); offset = *it.next()) { + masm.relocate(trampoline_stub_Relocation::spec(cb->insts()->start() + offset)); + } + masm.set_code_section(cb->insts()); + + address stub = masm.emit_trampoline_stub(offset, dest); + if (stub == nullptr) { + ciEnv::current()->record_failure("CodeCache is full"); + p_succeeded = false; + } + + return p_succeeded; + }; + + requests->iterate(emit); + + return p_succeeded; +} + +bool CodeBuffer::pd_finalize_stubs() { + return emit_shared_stubs_to_interp(this, _shared_stub_to_interp_requests) + && emit_shared_trampolines(this, _shared_trampoline_requests); } diff --git a/src/hotspot/cpu/aarch64/codeBuffer_aarch64.hpp b/src/hotspot/cpu/aarch64/codeBuffer_aarch64.hpp index f6b1241d4f1..e5c088bf497 100644 --- a/src/hotspot/cpu/aarch64/codeBuffer_aarch64.hpp +++ b/src/hotspot/cpu/aarch64/codeBuffer_aarch64.hpp @@ -34,4 +34,6 @@ public: void flush_bundle(bool start_new_bundle) {} static constexpr bool supports_shared_stubs() { return true; } + void share_trampoline_for(address dest, int caller_offset); + #endif // CPU_AARCH64_CODEBUFFER_AARCH64_HPP diff --git a/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp b/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp index 72d2103fc6a..8d1f99dddc1 100644 --- a/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp +++ b/src/hotspot/cpu/aarch64/macroAssembler_aarch64.cpp @@ -878,10 +878,15 @@ address MacroAssembler::trampoline_call(Address entry, CodeBuffer* cbuf) { if (!in_scratch_emit_size()) { // We don't want to emit a trampoline if C2 is generating dummy // code during its branch shortening phase. - address stub = emit_trampoline_stub(offset(), target); - if (stub == NULL) { - postcond(pc() == badAddress); - return NULL; // CodeCache is full + if (entry.rspec().type() == relocInfo::runtime_call_type) { + assert(CodeBuffer::supports_shared_stubs(), "must support shared stubs"); + code()->share_trampoline_for(entry.target(), offset()); + } else { + address stub = emit_trampoline_stub(offset(), target); + if (stub == NULL) { + postcond(pc() == badAddress); + return NULL; // CodeCache is full + } } } target = pc(); diff --git a/src/hotspot/share/asm/codeBuffer.hpp b/src/hotspot/share/asm/codeBuffer.hpp index 4cad3b4d30e..d026f97084f 100644 --- a/src/hotspot/share/asm/codeBuffer.hpp +++ b/src/hotspot/share/asm/codeBuffer.hpp @@ -31,6 +31,8 @@ #include "utilities/align.hpp" #include "utilities/debug.hpp" #include "utilities/growableArray.hpp" +#include "utilities/linkedlist.hpp" +#include "utilities/resizeableResourceHash.hpp" #include "utilities/macros.hpp" class PhaseCFG; @@ -398,6 +400,9 @@ class CodeBuffer: public StackObj DEBUG_ONLY(COMMA private Scrubber) { SECT_LIMIT, SECT_NONE = -1 }; + typedef LinkedListImpl Offsets; + typedef ResizeableResourceHashtable SharedTrampolineRequests; + private: enum { sect_bits = 2, // assert (SECT_LIMIT <= (1< command = new ArrayList(); + command.add(compiler); + command.add("-XX:+UnlockDiagnosticVMOptions"); + command.add("-Xbatch"); + command.add("-XX:+PrintRelocations"); + command.add("-XX:CompileCommand=compileonly," + testClassName + "::" + "test"); + command.add("-XX:CompileCommand=dontinline," + testClassName + "::" + "test"); + command.add("-XX:CompileCommand=dontinline," + testClassName + "::" + "log"); + command.add(testClassName); + command.add("a"); + + ProcessBuilder pb = ProcessTools.createJavaProcessBuilder(command); + + OutputAnalyzer analyzer = new OutputAnalyzer(pb.start()); + + analyzer.shouldHaveExitValue(0); + + System.out.println(analyzer.getOutput()); + + checkOutput(analyzer); + } + + public static void main(String[] args) throws Exception { + List compilers = List.of("-XX:-TieredCompilation" /* C2 */); + List tests = List.of("StaticMethodTest"); + for (String compiler : compilers) { + for (String test : tests) { + runTest(compiler, test); + } + } + } + + private static String skipTo(Iterator iter, String substring) { + while (iter.hasNext()) { + String nextLine = iter.next(); + if (nextLine.contains(substring)) { + return nextLine; + } + } + return null; + } + + private static void checkOutput(OutputAnalyzer output) { + List addrs = Pattern.compile("\\(trampoline_stub\\) addr=(\\w+) .*\\[trampoline owner") + .matcher(output.getStdout()) + .results() + .map(m -> m.group(1)) + .collect(Collectors.toList()); + if (addrs.stream().distinct().count() >= addrs.size()) { + throw new RuntimeException("No stubs reused"); + } + } + + public static class StaticMethodTest { + private static void log(int i, String msg) { + } + + static void test(int i, String[] args) { + if (i % args.length == 0) { + log(i, "args[0] = " + args[0]); + } else { + log(i, "No args"); + } + } + + public static void main(String[] args) { + for (int i = 1; i < ITERATIONS_TO_HEAT_LOOP; ++i) { + test(i, args); + } + } + } +}